2017-02-23 06:26:44 +08:00
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
< html xmlns = "http://www.w3.org/1999/xhtml" >
<head>
<!-- Document metadata emitted by Doxygen; attribute values are kept verbatim. -->
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
<meta name="generator" content="Doxygen 1.8.5"/>
<title>Faiss: /data/users/hoss/faiss/gpu/GpuIndex.cu Source File</title>
<!-- Stylesheets and scripts are loaded in the order the generator emitted them. -->
<link href="tabs.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="jquery.js"></script>
<script type="text/javascript" src="dynsections.js"></script>
<link href="search/search.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="search/search.js"></script>
<!-- Once the DOM is ready, select search filter 0 (the "All" entry of the filter window). -->
<script type="text/javascript">
  $(document).ready(function() { searchBox.OnSelectItem(0); });
</script>
<link href="doxygen.css" rel="stylesheet" type="text/css"/>
</head>
< body >
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
<!-- Project banner -->
<div id="titlearea">
<table cellspacing="0" cellpadding="0">
 <tbody>
 <tr style="height: 56px;">
  <td style="padding-left: 0.5em;">
   <div id="projectname">Faiss
   </div>
  </td>
 </tr>
 </tbody>
</table>
</div>
<!-- end header part -->
<!-- Generated by Doxygen 1.8.5 -->
<!-- Creates the global searchBox object that the inline event handlers below call into. -->
<script type="text/javascript">
var searchBox = new SearchBox("searchBox", "search",false,'Search');
</script>
<!-- Primary tab row; the last list item hosts the search box. -->
  <div id="navrow1" class="tabs">
    <ul class="tablist">
      <li><a href="index.html"><span>Main&#160;Page</span></a></li>
      <li><a href="namespaces.html"><span>Namespaces</span></a></li>
      <li><a href="annotated.html"><span>Classes</span></a></li>
      <li class="current"><a href="files.html"><span>Files</span></a></li>
      <li>
        <div id="MSearchBox" class="MSearchBoxInactive">
        <span class="left">
          <img id="MSearchSelect" src="search/mag_sel.png"
               onmouseover="return searchBox.OnSearchSelectShow()"
               onmouseout="return searchBox.OnSearchSelectHide()"
               alt=""/>
          <input type="text" id="MSearchField" value="Search" accesskey="S"
               onfocus="searchBox.OnSearchFieldFocus(true)"
               onblur="searchBox.OnSearchFieldFocus(false)"
               onkeyup="searchBox.OnSearchFieldChange(event)"/>
          </span><span class="right">
            <!-- The image is the link's only content, so its alt text names the action. -->
            <a id="MSearchClose" href="javascript:searchBox.CloseResultsWindow()"><img id="MSearchCloseImg" border="0" src="search/close.png" alt="Close search results"/></a>
          </span>
        </div>
      </li>
    </ul>
  </div>
<!-- Secondary tab row -->
  <div id="navrow2" class="tabs2">
    <ul class="tablist">
      <li><a href="files.html"><span>File&#160;List</span></a></li>
    </ul>
  </div>
<!-- window showing the filter options -->
<!-- Each SelectionMark span is kept as the first child of its link, with no whitespace in between. -->
<div id="MSearchSelectWindow"
     onmouseover="return searchBox.OnSearchSelectShow()"
     onmouseout="return searchBox.OnSearchSelectHide()"
     onkeydown="return searchBox.OnSearchSelectKey(event)">
<a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(0)"><span class="SelectionMark">&#160;</span>All</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(1)"><span class="SelectionMark">&#160;</span>Classes</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(2)"><span class="SelectionMark">&#160;</span>Namespaces</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(3)"><span class="SelectionMark">&#160;</span>Functions</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(4)"><span class="SelectionMark">&#160;</span>Variables</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(5)"><span class="SelectionMark">&#160;</span>Typedefs</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(6)"><span class="SelectionMark">&#160;</span>Enumerations</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(7)"><span class="SelectionMark">&#160;</span>Enumerator</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(8)"><span class="SelectionMark">&#160;</span>Friends</a></div>
<!-- iframe showing the search results (closed by default) -->
<div id="MSearchResultsWindow">
<iframe src="javascript:void(0)" frameborder="0"
        name="MSearchResults" id="MSearchResults" title="Search results">
</iframe>
</div>
<!-- Breadcrumb trail to the directory containing this file -->
<div id="nav-path" class="navpath">
  <ul>
    <li class="navelem"><a class="el" href="dir_5956a3e80a20e8e03eb577bedb92689f.html">gpu</a></li>
  </ul>
</div>
</div><!-- top -->
<!-- Page heading: the name of the source file shown on this page -->
<div class="header">
  <div class="headertitle">
    <div class="title">GpuIndex.cu</div>
  </div>
</div><!-- header -->
< div class = "contents" >
2017-06-21 21:54:28 +08:00
< div class = "fragment" > < div class = "line" > < a name = "l00001" > < / a > < span class = "lineno" > 1< / span >   < span class = "comment" > /**< / span > < / div >
2019-05-28 22:17:22 +08:00
< div class = "line" > < a name = "l00002" > < / a > < span class = "lineno" > 2< / span >   < span class = "comment" > * Copyright (c) Facebook, Inc. and its affiliates.< / span > < / div >
< div class = "line" > < a name = "l00003" > < / a > < span class = "lineno" > 3< / span >   < span class = "comment" > *< / span > < / div >
< div class = "line" > < a name = "l00004" > < / a > < span class = "lineno" > 4< / span >   < span class = "comment" > * This source code is licensed under the MIT license found in the< / span > < / div >
< div class = "line" > < a name = "l00005" > < / a > < span class = "lineno" > 5< / span >   < span class = "comment" > * LICENSE file in the root directory of this source tree.< / span > < / div >
< div class = "line" > < a name = "l00006" > < / a > < span class = "lineno" > 6< / span >   < span class = "comment" > */< / span > < / div >
< div class = "line" > < a name = "l00007" > < / a > < span class = "lineno" > 7< / span >   < / div >
2017-06-21 21:54:28 +08:00
< div class = "line" > < a name = "l00008" > < / a > < span class = "lineno" > 8< / span >   < / div >
2019-05-28 22:17:22 +08:00
< div class = "line" > < a name = "l00009" > < / a > < span class = "lineno" > 9< / span >   < span class = "preprocessor" > #include " GpuIndex.h" < / span > < / div >
< div class = "line" > < a name = "l00010" > < / a > < span class = "lineno" > 10< / span >   < span class = "preprocessor" > #include " ../FaissAssert.h" < / span > < / div >
< div class = "line" > < a name = "l00011" > < / a > < span class = "lineno" > 11< / span >   < span class = "preprocessor" > #include " GpuResources.h" < / span > < / div >
< div class = "line" > < a name = "l00012" > < / a > < span class = "lineno" > 12< / span >   < span class = "preprocessor" > #include " utils/CopyUtils.cuh" < / span > < / div >
2018-12-20 00:48:35 +08:00
< div class = "line" > < a name = "l00013" > < / a > < span class = "lineno" > 13< / span >   < span class = "preprocessor" > #include " utils/DeviceUtils.h" < / span > < / div >
2019-05-28 22:17:22 +08:00
< div class = "line" > < a name = "l00014" > < / a > < span class = "lineno" > 14< / span >   < span class = "preprocessor" > #include " utils/StaticUtils.h" < / span > < / div >
< div class = "line" > < a name = "l00015" > < / a > < span class = "lineno" > 15< / span >   < span class = "preprocessor" > #include < limits> < / span > < / div >
< div class = "line" > < a name = "l00016" > < / a > < span class = "lineno" > 16< / span >   < span class = "preprocessor" > #include < memory> < / span > < / div >
2018-12-20 00:48:35 +08:00
< div class = "line" > < a name = "l00017" > < / a > < span class = "lineno" > 17< / span >   < / div >
2019-05-28 22:17:22 +08:00
< div class = "line" > < a name = "l00018" > < / a > < span class = "lineno" > 18< / span >   < span class = "keyword" > namespace < / span > faiss { < span class = "keyword" > namespace < / span > gpu {< / div >
< div class = "line" > < a name = "l00019" > < / a > < span class = "lineno" > 19< / span >   < span class = "comment" > < / span > < / div >
< div class = "line" > < a name = "l00020" > < / a > < span class = "lineno" > 20< / span >   < span class = "comment" > /// Default CPU search size for which we use paged copies< / span > < / div >
< div class = "line" > < a name = "l00021" > < / a > < span class = "lineno" > 21< / span >   < span class = "comment" > < / span > constexpr < span class = "keywordtype" > size_t< / span > kMinPageSize = (size_t) 256 * 1024 * 1024;< / div >
< div class = "line" > < a name = "l00022" > < / a > < span class = "lineno" > 22< / span >   < span class = "comment" > < / span > < / div >
< div class = "line" > < a name = "l00023" > < / a > < span class = "lineno" > 23< / span >   < span class = "comment" > /// Size above which we page copies from the CPU to GPU (non-paged< / span > < / div >
< div class = "line" > < a name = "l00024" > < / a > < span class = "lineno" > 24< / span >   < span class = "comment" > /// memory usage)< / span > < / div >
< div class = "line" > < a name = "l00025" > < / a > < span class = "lineno" > 25< / span >   < span class = "comment" > < / span > constexpr < span class = "keywordtype" > size_t< / span > kNonPinnedPageSize = (size_t) 256 * 1024 * 1024;< / div >
< div class = "line" > < a name = "l00026" > < / a > < span class = "lineno" > 26< / span >   < / div >
< div class = "line" > < a name = "l00027" > < / a > < span class = "lineno" > 27< / span >   < span class = "comment" > // Default size for which we page add or search< / span > < / div >
< div class = "line" > < a name = "l00028" > < / a > < span class = "lineno" > 28< / span >   constexpr < span class = "keywordtype" > size_t< / span > kAddPageSize = (size_t) 256 * 1024 * 1024;< / div >
2018-12-20 00:48:35 +08:00
< div class = "line" > < a name = "l00029" > < / a > < span class = "lineno" > 29< / span >   < / div >
2019-05-28 22:17:22 +08:00
< div class = "line" > < a name = "l00030" > < / a > < span class = "lineno" > 30< / span >   < span class = "comment" > // Or, maximum number of vectors to consider per page of add or search< / span > < / div >
< div class = "line" > < a name = "l00031" > < / a > < span class = "lineno" > 31< / span >   constexpr < span class = "keywordtype" > size_t< / span > kAddVecSize = (size_t) 512 * 1024;< / div >
< div class = "line" > < a name = "l00032" > < / a > < span class = "lineno" > 32< / span >   < / div >
< div class = "line" > < a name = "l00033" > < / a > < span class = "lineno" > 33< / span >   < span class = "comment" > // Use a smaller search size, as precomputed code usage on IVFPQ< / span > < / div >
< div class = "line" > < a name = "l00034" > < / a > < span class = "lineno" > 34< / span >   < span class = "comment" > // requires substantial amounts of memory< / span > < / div >
< div class = "line" > < a name = "l00035" > < / a > < span class = "lineno" > 35< / span >   < span class = "comment" > // FIXME: parameterize based on algorithm need< / span > < / div >
< div class = "line" > < a name = "l00036" > < / a > < span class = "lineno" > 36< / span >   constexpr < span class = "keywordtype" > size_t< / span > kSearchVecSize = (size_t) 32 * 1024;< / div >
< div class = "line" > < a name = "l00037" > < / a > < span class = "lineno" > 37< / span >   < / div >
< div class = "line" > < a name = "l00038" > < / a > < span class = "lineno" > 38< / span >   GpuIndex::GpuIndex(GpuResources* resources,< / div >
< div class = "line" > < a name = "l00039" > < / a > < span class = "lineno" > 39< / span >   < span class = "keywordtype" > int< / span > dims,< / div >
< div class = "line" > < a name = "l00040" > < / a > < span class = "lineno" > 40< / span >   < a class = "code" href = "namespacefaiss.html#afd12191c638da74760ff397cf319752c" > faiss::MetricType< / a > metric,< / div >
< div class = "line" > < a name = "l00041" > < / a > < span class = "lineno" > 41< / span >   GpuIndexConfig config) :< / div >
< div class = "line" > < a name = "l00042" > < / a > < span class = "lineno" > 42< / span >   Index(dims, metric),< / div >
< div class = "line" > < a name = "l00043" > < / a > < span class = "lineno" > 43< / span >   resources_(resources),< / div >
< div class = "line" > < a name = "l00044" > < / a > < span class = "lineno" > 44< / span >   device_(config.device),< / div >
< div class = "line" > < a name = "l00045" > < / a > < span class = "lineno" > 45< / span >   memorySpace_(config.memorySpace),< / div >
< div class = "line" > < a name = "l00046" > < / a > < span class = "lineno" > 46< / span >   minPagedSize_(kMinPageSize) {< / div >
< div class = "line" > < a name = "l00047" > < / a > < span class = "lineno" > 47< / span >   FAISS_THROW_IF_NOT_FMT(device_ < getNumDevices(),< / div >
< div class = "line" > < a name = "l00048" > < / a > < span class = "lineno" > 48< / span >   < span class = "stringliteral" > " Invalid GPU device %d" < / span > , device_);< / div >
< div class = "line" > < a name = "l00049" > < / a > < span class = "lineno" > 49< / span >   < / div >
< div class = "line" > < a name = "l00050" > < / a > < span class = "lineno" > 50< / span >   FAISS_THROW_IF_NOT_MSG(dims > 0, < span class = "stringliteral" > " Invalid number of dimensions" < / span > );< / div >
< div class = "line" > < a name = "l00051" > < / a > < span class = "lineno" > 51< / span >   < / div >
< div class = "line" > < a name = "l00052" > < / a > < span class = "lineno" > 52< / span >   < span class = "preprocessor" > #ifdef FAISS_UNIFIED_MEM< / span > < / div >
< div class = "line" > < a name = "l00053" > < / a > < span class = "lineno" > 53< / span >   < span class = "preprocessor" > < / span > FAISS_THROW_IF_NOT_FMT(< / div >
< div class = "line" > < a name = "l00054" > < / a > < span class = "lineno" > 54< / span >   memorySpace_ == MemorySpace::Device ||< / div >
< div class = "line" > < a name = "l00055" > < / a > < span class = "lineno" > 55< / span >   (memorySpace_ == MemorySpace::Unified & & < / div >
< div class = "line" > < a name = "l00056" > < / a > < span class = "lineno" > 56< / span >   getFullUnifiedMemSupport(device_)),< / div >
< div class = "line" > < a name = "l00057" > < / a > < span class = "lineno" > 57< / span >   < span class = "stringliteral" > " Device %d does not support full CUDA 8 Unified Memory (CC 6.0+)" < / span > ,< / div >
< div class = "line" > < a name = "l00058" > < / a > < span class = "lineno" > 58< / span >   config.device);< / div >
< div class = "line" > < a name = "l00059" > < / a > < span class = "lineno" > 59< / span >   < span class = "preprocessor" > #else< / span > < / div >
< div class = "line" > < a name = "l00060" > < / a > < span class = "lineno" > 60< / span >   < span class = "preprocessor" > < / span > FAISS_THROW_IF_NOT_MSG(memorySpace_ == MemorySpace::Device,< / div >
< div class = "line" > < a name = "l00061" > < / a > < span class = "lineno" > 61< / span >   < span class = "stringliteral" > " Must compile with CUDA 8+ for Unified Memory support" < / span > );< / div >
< div class = "line" > < a name = "l00062" > < / a > < span class = "lineno" > 62< / span >   < span class = "preprocessor" > #endif< / span > < / div >
< div class = "line" > < a name = "l00063" > < / a > < span class = "lineno" > 63< / span >   < span class = "preprocessor" > < / span > < / div >
< div class = "line" > < a name = "l00064" > < / a > < span class = "lineno" > 64< / span >   FAISS_ASSERT(resources_);< / div >
< div class = "line" > < a name = "l00065" > < / a > < span class = "lineno" > 65< / span >   resources_-> initializeForDevice(device_);< / div >
< div class = "line" > < a name = "l00066" > < / a > < span class = "lineno" > 66< / span >   }< / div >
< div class = "line" > < a name = "l00067" > < / a > < span class = "lineno" > 67< / span >   < / div >
< div class = "line" > < a name = "l00068" > < / a > < span class = "lineno" > 68< / span >   < span class = "keywordtype" > void< / span > < / div >
< div class = "line" > < a name = "l00069" > < / a > < span class = "lineno" > < a class = "line" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a6c82cbea6b02cc996d634f822c1d310b" > 69< / a > < / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a6c82cbea6b02cc996d634f822c1d310b" > GpuIndex::setMinPagingSize< / a > (< span class = "keywordtype" > size_t< / span > size) {< / div >
< div class = "line" > < a name = "l00070" > < / a > < span class = "lineno" > 70< / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a32a08664fc4dca2f9405e07ea5bc206f" > minPagedSize_< / a > = size;< / div >
< div class = "line" > < a name = "l00071" > < / a > < span class = "lineno" > 71< / span >   }< / div >
< div class = "line" > < a name = "l00072" > < / a > < span class = "lineno" > 72< / span >   < / div >
< div class = "line" > < a name = "l00073" > < / a > < span class = "lineno" > 73< / span >   < span class = "keywordtype" > size_t< / span > < / div >
< div class = "line" > < a name = "l00074" > < / a > < span class = "lineno" > < a class = "line" href = "classfaiss_1_1gpu_1_1GpuIndex.html#adbdc96814ff2d4390dfd860bd5918203" > 74< / a > < / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#adbdc96814ff2d4390dfd860bd5918203" > GpuIndex::getMinPagingSize< / a > ()< span class = "keyword" > const < / span > {< / div >
< div class = "line" > < a name = "l00075" > < / a > < span class = "lineno" > 75< / span >   < span class = "keywordflow" > return< / span > < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a32a08664fc4dca2f9405e07ea5bc206f" > minPagedSize_< / a > ;< / div >
< div class = "line" > < a name = "l00076" > < / a > < span class = "lineno" > 76< / span >   }< / div >
< div class = "line" > < a name = "l00077" > < / a > < span class = "lineno" > 77< / span >   < / div >
< div class = "line" > < a name = "l00078" > < / a > < span class = "lineno" > 78< / span >   < span class = "keywordtype" > void< / span > < / div >
< div class = "line" > < a name = "l00079" > < / a > < span class = "lineno" > < a class = "line" href = "classfaiss_1_1gpu_1_1GpuIndex.html#af576341f6996b0e80e26b9748db51eb7" > 79< / a > < / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#af576341f6996b0e80e26b9748db51eb7" > GpuIndex::add< / a > (< a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > n, < span class = "keyword" > const< / span > < span class = "keywordtype" > float< / span > * x) {< / div >
< div class = "line" > < a name = "l00080" > < / a > < span class = "lineno" > 80< / span >   < span class = "comment" > // Pass to add_with_ids< / span > < / div >
< div class = "line" > < a name = "l00081" > < / a > < span class = "lineno" > 81< / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a47f6969fe60d82b8e3407557ba9eec88" > add_with_ids< / a > (n, x, < span class = "keyword" > nullptr< / span > );< / div >
< div class = "line" > < a name = "l00082" > < / a > < span class = "lineno" > 82< / span >   }< / div >
< div class = "line" > < a name = "l00083" > < / a > < span class = "lineno" > 83< / span >   < / div >
< div class = "line" > < a name = "l00084" > < / a > < span class = "lineno" > 84< / span >   < span class = "keywordtype" > void< / span > < / div >
< div class = "line" > < a name = "l00085" > < / a > < span class = "lineno" > < a class = "line" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a47f6969fe60d82b8e3407557ba9eec88" > 85< / a > < / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a47f6969fe60d82b8e3407557ba9eec88" > GpuIndex::add_with_ids< / a > (< a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > n,< / div >
< div class = "line" > < a name = "l00086" > < / a > < span class = "lineno" > 86< / span >   < span class = "keyword" > const< / span > < span class = "keywordtype" > float< / span > * x,< / div >
< div class = "line" > < a name = "l00087" > < / a > < span class = "lineno" > 87< / span >   < span class = "keyword" > const< / span > < a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > * ids) {< / div >
< div class = "line" > < a name = "l00088" > < / a > < span class = "lineno" > 88< / span >   FAISS_THROW_IF_NOT_MSG(this-> < a class = "code" href = "structfaiss_1_1Index.html#a6e92732617c4dbe364e7678dd8773a7f" > is_trained< / a > , < span class = "stringliteral" > " Index not trained" < / span > );< / div >
2018-12-20 00:48:35 +08:00
< div class = "line" > < a name = "l00089" > < / a > < span class = "lineno" > 89< / span >   < / div >
2019-05-28 22:17:22 +08:00
< div class = "line" > < a name = "l00090" > < / a > < span class = "lineno" > 90< / span >   < span class = "comment" > // For now, only support < = max int results< / span > < / div >
< div class = "line" > < a name = "l00091" > < / a > < span class = "lineno" > 91< / span >   FAISS_THROW_IF_NOT_FMT(n < = (< a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > ) std::numeric_limits< int> ::max(),< / div >
< div class = "line" > < a name = "l00092" > < / a > < span class = "lineno" > 92< / span >   < span class = "stringliteral" > " GPU index only supports up to %d indices" < / span > ,< / div >
< div class = "line" > < a name = "l00093" > < / a > < span class = "lineno" > 93< / span >   std::numeric_limits< int> ::max());< / div >
< div class = "line" > < a name = "l00094" > < / a > < span class = "lineno" > 94< / span >   < / div >
< div class = "line" > < a name = "l00095" > < / a > < span class = "lineno" > 95< / span >   < span class = "keywordflow" > if< / span > (n == 0) {< / div >
< div class = "line" > < a name = "l00096" > < / a > < span class = "lineno" > 96< / span >   < span class = "comment" > // nothing to add< / span > < / div >
< div class = "line" > < a name = "l00097" > < / a > < span class = "lineno" > 97< / span >   < span class = "keywordflow" > return< / span > ;< / div >
< div class = "line" > < a name = "l00098" > < / a > < span class = "lineno" > 98< / span >   }< / div >
< div class = "line" > < a name = "l00099" > < / a > < span class = "lineno" > 99< / span >   < / div >
< div class = "line" > < a name = "l00100" > < / a > < span class = "lineno" > 100< / span >   std::vector< Index::idx_t> generatedIds;< / div >
< div class = "line" > < a name = "l00101" > < / a > < span class = "lineno" > 101< / span >   < / div >
< div class = "line" > < a name = "l00102" > < / a > < span class = "lineno" > 102< / span >   < span class = "comment" > // Generate IDs if we need them< / span > < / div >
< div class = "line" > < a name = "l00103" > < / a > < span class = "lineno" > 103< / span >   < span class = "keywordflow" > if< / span > (!ids & & < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a358cad8f80a9c4b3aff45f3f7c131d03" > addImplRequiresIDs_< / a > ()) {< / div >
< div class = "line" > < a name = "l00104" > < / a > < span class = "lineno" > 104< / span >   generatedIds = std::vector< Index::idx_t> (n);< / div >
2018-12-20 00:48:35 +08:00
< div class = "line" > < a name = "l00105" > < / a > < span class = "lineno" > 105< / span >   < / div >
2019-05-28 22:17:22 +08:00
< div class = "line" > < a name = "l00106" > < / a > < span class = "lineno" > 106< / span >   < span class = "keywordflow" > for< / span > (< a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > i = 0; i < n; ++i) {< / div >
< div class = "line" > < a name = "l00107" > < / a > < span class = "lineno" > 107< / span >   generatedIds[i] = this-> < a class = "code" href = "structfaiss_1_1Index.html#a6970683faa021b7a6f1a0865c0d4eccd" > ntotal< / a > + i;< / div >
< div class = "line" > < a name = "l00108" > < / a > < span class = "lineno" > 108< / span >   }< / div >
< div class = "line" > < a name = "l00109" > < / a > < span class = "lineno" > 109< / span >   }< / div >
< div class = "line" > < a name = "l00110" > < / a > < span class = "lineno" > 110< / span >   < / div >
< div class = "line" > < a name = "l00111" > < / a > < span class = "lineno" > 111< / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1DeviceScope.html" > DeviceScope< / a > scope(< a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a67750633faa35677ee505a1e61cfe142" > device_< / a > );< / div >
< div class = "line" > < a name = "l00112" > < / a > < span class = "lineno" > 112< / span >   addPaged_((< span class = "keywordtype" > int< / span > ) n, x, ids ? ids : generatedIds.data());< / div >
< div class = "line" > < a name = "l00113" > < / a > < span class = "lineno" > 113< / span >   }< / div >
< div class = "line" > < a name = "l00114" > < / a > < span class = "lineno" > 114< / span >   < / div >
< div class = "line" > < a name = "l00115" > < / a > < span class = "lineno" > 115< / span >   < span class = "keywordtype" > void< / span > < / div >
< div class = "line" > < a name = "l00116" > < / a > < span class = "lineno" > 116< / span >   GpuIndex::addPaged_(< span class = "keywordtype" > int< / span > n,< / div >
< div class = "line" > < a name = "l00117" > < / a > < span class = "lineno" > 117< / span >   < span class = "keyword" > const< / span > < span class = "keywordtype" > float< / span > * x,< / div >
< div class = "line" > < a name = "l00118" > < / a > < span class = "lineno" > 118< / span >   < span class = "keyword" > const< / span > < a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > * ids) {< / div >
< div class = "line" > < a name = "l00119" > < / a > < span class = "lineno" > 119< / span >   < span class = "keywordflow" > if< / span > (n > 0) {< / div >
< div class = "line" > < a name = "l00120" > < / a > < span class = "lineno" > 120< / span >   < span class = "keywordtype" > size_t< / span > totalSize = (size_t) n * this-> < a class = "code" href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > d< / a > * < span class = "keyword" > sizeof< / span > (< span class = "keywordtype" > float< / span > );< / div >
< div class = "line" > < a name = "l00121" > < / a > < span class = "lineno" > 121< / span >   < / div >
< div class = "line" > < a name = "l00122" > < / a > < span class = "lineno" > 122< / span >   < span class = "keywordflow" > if< / span > (totalSize > kAddPageSize || n > kAddVecSize) {< / div >
< div class = "line" > < a name = "l00123" > < / a > < span class = "lineno" > 123< / span >   < span class = "comment" > // How many vectors fit into kAddPageSize?< / span > < / div >
< div class = "line" > < a name = "l00124" > < / a > < span class = "lineno" > 124< / span >   < span class = "keywordtype" > size_t< / span > maxNumVecsForPageSize =< / div >
< div class = "line" > < a name = "l00125" > < / a > < span class = "lineno" > 125< / span >   kAddPageSize / ((size_t) this-> < a class = "code" href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > d< / a > * < span class = "keyword" > sizeof< / span > (< span class = "keywordtype" > float< / span > ));< / div >
< div class = "line" > < a name = "l00126" > < / a > < span class = "lineno" > 126< / span >   < / div >
< div class = "line" > < a name = "l00127" > < / a > < span class = "lineno" > 127< / span >   < span class = "comment" > // Always add at least 1 vector, if we have huge vectors< / span > < / div >
< div class = "line" > < a name = "l00128" > < / a > < span class = "lineno" > 128< / span >   maxNumVecsForPageSize = std::max(maxNumVecsForPageSize, (< span class = "keywordtype" > size_t< / span > ) 1);< / div >
< div class = "line" > < a name = "l00129" > < / a > < span class = "lineno" > 129< / span >   < / div >
< div class = "line" > < a name = "l00130" > < / a > < span class = "lineno" > 130< / span >   < span class = "keywordtype" > size_t< / span > tileSize = std::min((< span class = "keywordtype" > size_t< / span > ) n, maxNumVecsForPageSize);< / div >
< div class = "line" > < a name = "l00131" > < / a > < span class = "lineno" > 131< / span >   tileSize = std::min(tileSize, kSearchVecSize);< / div >
< div class = "line" > < a name = "l00132" > < / a > < span class = "lineno" > 132< / span >   < / div >
< div class = "line" > < a name = "l00133" > < / a > < span class = "lineno" > 133< / span >   < span class = "keywordflow" > for< / span > (< span class = "keywordtype" > size_t< / span > i = 0; i < (size_t) n; i += tileSize) {< / div >
< div class = "line" > < a name = "l00134" > < / a > < span class = "lineno" > 134< / span >   < span class = "keywordtype" > size_t< / span > curNum = std::min(tileSize, n - i);< / div >
< div class = "line" > < a name = "l00135" > < / a > < span class = "lineno" > 135< / span >   < / div >
< div class = "line" > < a name = "l00136" > < / a > < span class = "lineno" > 136< / span >   addPage_(curNum,< / div >
< div class = "line" > < a name = "l00137" > < / a > < span class = "lineno" > 137< / span >   x + i * (< span class = "keywordtype" > size_t< / span > ) this-> < a class = "code" href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > d< / a > ,< / div >
< div class = "line" > < a name = "l00138" > < / a > < span class = "lineno" > 138< / span >   ids ? ids + i : < span class = "keyword" > nullptr< / span > );< / div >
< div class = "line" > < a name = "l00139" > < / a > < span class = "lineno" > 139< / span >   }< / div >
< div class = "line" > < a name = "l00140" > < / a > < span class = "lineno" > 140< / span >   } < span class = "keywordflow" > else< / span > {< / div >
< div class = "line" > < a name = "l00141" > < / a > < span class = "lineno" > 141< / span >   addPage_(n, x, ids);< / div >
< div class = "line" > < a name = "l00142" > < / a > < span class = "lineno" > 142< / span >   }< / div >
< div class = "line" > < a name = "l00143" > < / a > < span class = "lineno" > 143< / span >   }< / div >
< div class = "line" > < a name = "l00144" > < / a > < span class = "lineno" > 144< / span >   }< / div >
< div class = "line" > < a name = "l00145" > < / a > < span class = "lineno" > 145< / span >   < / div >
< div class = "line" > < a name = "l00146" > < / a > < span class = "lineno" > 146< / span >   < span class = "keywordtype" > void< / span > < / div >
< div class = "line" > < a name = "l00147" > < / a > < span class = "lineno" > 147< / span >   GpuIndex::addPage_(< span class = "keywordtype" > int< / span > n,< / div >
< div class = "line" > < a name = "l00148" > < / a > < span class = "lineno" > 148< / span >   < span class = "keyword" > const< / span > < span class = "keywordtype" > float< / span > * x,< / div >
< div class = "line" > < a name = "l00149" > < / a > < span class = "lineno" > 149< / span >   < span class = "keyword" > const< / span > < a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > * ids) {< / div >
< div class = "line" > < a name = "l00150" > < / a > < span class = "lineno" > 150< / span >   < span class = "comment" > // At this point, `x` can be resident on CPU or GPU, and `ids` may be resident< / span > < / div >
< div class = "line" > < a name = "l00151" > < / a > < span class = "lineno" > 151< / span >   < span class = "comment" > // on CPU, GPU or may be null.< / span > < / div >
< div class = "line" > < a name = "l00152" > < / a > < span class = "lineno" > 152< / span >   < span class = "comment" > //< / span > < / div >
< div class = "line" > < a name = "l00153" > < / a > < span class = "lineno" > 153< / span >   < span class = "comment" > // Before continuing, we guarantee that all data will be resident on the GPU.< / span > < / div >
< div class = "line" > < a name = "l00154" > < / a > < span class = "lineno" > 154< / span >   < span class = "keyword" > auto< / span > stream = < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a17b82a8a11783da6eb1b07c9aab98c36" > resources_< / a > -> < a class = "code" href = "classfaiss_1_1gpu_1_1GpuResources.html#aa0354aa570c24e17a9f8a6a45b153ed2" > getDefaultStreamCurrentDevice< / a > ();< / div >
< div class = "line" > < a name = "l00155" > < / a > < span class = "lineno" > 155< / span >   < / div >
< div class = "line" > < a name = "l00156" > < / a > < span class = "lineno" > 156< / span >   < span class = "keyword" > auto< / span > vecs = toDevice< float, 2> (< a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a17b82a8a11783da6eb1b07c9aab98c36" > resources_< / a > ,< / div >
< div class = "line" > < a name = "l00157" > < / a > < span class = "lineno" > 157< / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a67750633faa35677ee505a1e61cfe142" > device_< / a > ,< / div >
< div class = "line" > < a name = "l00158" > < / a > < span class = "lineno" > 158< / span >   < span class = "keyword" > const_cast< < / span > < span class = "keywordtype" > float< / span > *< span class = "keyword" > > < / span > (x),< / div >
< div class = "line" > < a name = "l00159" > < / a > < span class = "lineno" > 159< / span >   stream,< / div >
< div class = "line" > < a name = "l00160" > < / a > < span class = "lineno" > 160< / span >   {n, this-> < a class = "code" href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > d< / a > });< / div >
< div class = "line" > < a name = "l00161" > < / a > < span class = "lineno" > 161< / span >   < / div >
< div class = "line" > < a name = "l00162" > < / a > < span class = "lineno" > 162< / span >   < span class = "keywordflow" > if< / span > (ids) {< / div >
< div class = "line" > < a name = "l00163" > < / a > < span class = "lineno" > 163< / span >   < span class = "keyword" > auto< / span > indices = toDevice< Index::idx_t, 1> (< a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a17b82a8a11783da6eb1b07c9aab98c36" > resources_< / a > ,< / div >
< div class = "line" > < a name = "l00164" > < / a > < span class = "lineno" > 164< / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a67750633faa35677ee505a1e61cfe142" > device_< / a > ,< / div >
< div class = "line" > < a name = "l00165" > < / a > < span class = "lineno" > 165< / span >   < span class = "keyword" > const_cast< < / span > < a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > *< span class = "keyword" > > < / span > (ids),< / div >
< div class = "line" > < a name = "l00166" > < / a > < span class = "lineno" > 166< / span >   stream,< / div >
< div class = "line" > < a name = "l00167" > < / a > < span class = "lineno" > 167< / span >   {n});< / div >
< div class = "line" > < a name = "l00168" > < / a > < span class = "lineno" > 168< / span >   < / div >
< div class = "line" > < a name = "l00169" > < / a > < span class = "lineno" > 169< / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#ae8479445214c5ef37adf154c138ce973" > addImpl_< / a > (n, vecs.data(), ids ? indices.data() : < span class = "keyword" > nullptr< / span > );< / div >
< div class = "line" > < a name = "l00170" > < / a > < span class = "lineno" > 170< / span >   } < span class = "keywordflow" > else< / span > {< / div >
< div class = "line" > < a name = "l00171" > < / a > < span class = "lineno" > 171< / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#ae8479445214c5ef37adf154c138ce973" > addImpl_< / a > (n, vecs.data(), < span class = "keyword" > nullptr< / span > );< / div >
< div class = "line" > < a name = "l00172" > < / a > < span class = "lineno" > 172< / span >   }< / div >
< div class = "line" > < a name = "l00173" > < / a > < span class = "lineno" > 173< / span >   }< / div >
< div class = "line" > < a name = "l00174" > < / a > < span class = "lineno" > 174< / span >   < / div >
< div class = "line" > < a name = "l00175" > < / a > < span class = "lineno" > 175< / span >   < span class = "keywordtype" > void< / span > < / div >
< div class = "line" > < a name = "l00176" > < / a > < span class = "lineno" > < a class = "line" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a4564ff946e4339156173b39449562971" > 176< / a > < / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a4564ff946e4339156173b39449562971" > GpuIndex::search< / a > (< a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > n,< / div >
< div class = "line" > < a name = "l00177" > < / a > < span class = "lineno" > 177< / span >   < span class = "keyword" > const< / span > < span class = "keywordtype" > float< / span > * x,< / div >
< div class = "line" > < a name = "l00178" > < / a > < span class = "lineno" > 178< / span >   < a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > k,< / div >
< div class = "line" > < a name = "l00179" > < / a > < span class = "lineno" > 179< / span >   < span class = "keywordtype" > float< / span > * distances,< / div >
< div class = "line" > < a name = "l00180" > < / a > < span class = "lineno" > 180< / span >   < a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > * labels)< span class = "keyword" > const < / span > {< / div >
< div class = "line" > < a name = "l00181" > < / a > < span class = "lineno" > 181< / span >   FAISS_THROW_IF_NOT_MSG(this-> < a class = "code" href = "structfaiss_1_1Index.html#a6e92732617c4dbe364e7678dd8773a7f" > is_trained< / a > , < span class = "stringliteral" > "Index not trained"< / span > );< / div >
< div class = "line" > < a name = "l00182" > < / a > < span class = "lineno" > 182< / span >   < / div >
< div class = "line" > < a name = "l00183" > < / a > < span class = "lineno" > 183< / span >   < span class = "comment" > // For now, only support &lt;= max int results< / span > < / div >
< div class = "line" > < a name = "l00184" > < / a > < span class = "lineno" > 184< / span >   FAISS_THROW_IF_NOT_FMT(n < = (< a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > ) std::numeric_limits< int> ::max(),< / div >
< div class = "line" > < a name = "l00185" > < / a > < span class = "lineno" > 185< / span >   < span class = "stringliteral" > "GPU index only supports up to %d indices"< / span > ,< / div >
< div class = "line" > < a name = "l00186" > < / a > < span class = "lineno" > 186< / span >   std::numeric_limits< int> ::max());< / div >
< div class = "line" > < a name = "l00187" > < / a > < span class = "lineno" > 187< / span >   < / div >
< div class = "line" > < a name = "l00188" > < / a > < span class = "lineno" > 188< / span >   < span class = "comment" > // Maximum k-selection supported is based on the CUDA SDK< / span > < / div >
< div class = "line" > < a name = "l00189" > < / a > < span class = "lineno" > 189< / span >   FAISS_THROW_IF_NOT_FMT(k < = (< a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > ) getMaxKSelection(),< / div >
< div class = "line" > < a name = "l00190" > < / a > < span class = "lineno" > 190< / span >   < span class = "stringliteral" > "GPU index only supports k &lt;= %d (requested %d)"< / span > ,< / div >
< div class = "line" > < a name = "l00191" > < / a > < span class = "lineno" > 191< / span >   getMaxKSelection(),< / div >
< div class = "line" > < a name = "l00192" > < / a > < span class = "lineno" > 192< / span >   (< span class = "keywordtype" > int< / span > ) k); < span class = "comment" > // select limitation< / span > < / div >
< div class = "line" > < a name = "l00193" > < / a > < span class = "lineno" > 193< / span >   < / div >
< div class = "line" > < a name = "l00194" > < / a > < span class = "lineno" > 194< / span >   < span class = "keywordflow" > if< / span > (n == 0 || k == 0) {< / div >
< div class = "line" > < a name = "l00195" > < / a > < span class = "lineno" > 195< / span >   < span class = "comment" > // nothing to search< / span > < / div >
< div class = "line" > < a name = "l00196" > < / a > < span class = "lineno" > 196< / span >   < span class = "keywordflow" > return< / span > ;< / div >
< div class = "line" > < a name = "l00197" > < / a > < span class = "lineno" > 197< / span >   }< / div >
< div class = "line" > < a name = "l00198" > < / a > < span class = "lineno" > 198< / span >   < / div >
< div class = "line" > < a name = "l00199" > < / a > < span class = "lineno" > 199< / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1DeviceScope.html" > DeviceScope< / a > scope(device_);< / div >
< div class = "line" > < a name = "l00200" > < / a > < span class = "lineno" > 200< / span >   < span class = "keyword" > auto< / span > stream = resources_-> getDefaultStream(device_);< / div >
< div class = "line" > < a name = "l00201" > < / a > < span class = "lineno" > 201< / span >   < / div >
< div class = "line" > < a name = "l00202" > < / a > < span class = "lineno" > 202< / span >   < span class = "comment" > // We guarantee that the searchImpl_ will be called with device-resident< / span > < / div >
< div class = "line" > < a name = "l00203" > < / a > < span class = "lineno" > 203< / span >   < span class = "comment" > // pointers.< / span > < / div >
< div class = "line" > < a name = "l00204" > < / a > < span class = "lineno" > 204< / span >   < / div >
< div class = "line" > < a name = "l00205" > < / a > < span class = "lineno" > 205< / span >   < span class = "comment" > // The input vectors may be too large for the GPU, but we still< / span > < / div >
< div class = "line" > < a name = "l00206" > < / a > < span class = "lineno" > 206< / span >   < span class = "comment" > // assume that the output distances and labels are not.< / span > < / div >
< div class = "line" > < a name = "l00207" > < / a > < span class = "lineno" > 207< / span >   < span class = "comment" > // Go ahead and make space for output distances and labels on the< / span > < / div >
< div class = "line" > < a name = "l00208" > < / a > < span class = "lineno" > 208< / span >   < span class = "comment" > // GPU.< / span > < / div >
< div class = "line" > < a name = "l00209" > < / a > < span class = "lineno" > 209< / span >   < span class = "comment" > // If we reach a point where all inputs are too big, we can add< / span > < / div >
< div class = "line" > < a name = "l00210" > < / a > < span class = "lineno" > 210< / span >   < span class = "comment" > // another level of tiling.< / span > < / div >
< div class = "line" > < a name = "l00211" > < / a > < span class = "lineno" > 211< / span >   < span class = "keyword" > auto< / span > outDistances =< / div >
< div class = "line" > < a name = "l00212" > < / a > < span class = "lineno" > 212< / span >   toDevice< float, 2> (< a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a17b82a8a11783da6eb1b07c9aab98c36" > resources_< / a > , < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a67750633faa35677ee505a1e61cfe142" > device_< / a > , distances, stream,< / div >
< div class = "line" > < a name = "l00213" > < / a > < span class = "lineno" > 213< / span >   {(int) n, (< span class = "keywordtype" > int< / span > ) k});< / div >
< div class = "line" > < a name = "l00214" > < / a > < span class = "lineno" > 214< / span >   < / div >
< div class = "line" > < a name = "l00215" > < / a > < span class = "lineno" > 215< / span >   < span class = "keyword" > auto< / span > outLabels =< / div >
< div class = "line" > < a name = "l00216" > < / a > < span class = "lineno" > 216< / span >   toDevice< faiss::Index::idx_t, 2> (< a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a17b82a8a11783da6eb1b07c9aab98c36" > resources_< / a > , < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a67750633faa35677ee505a1e61cfe142" > device_< / a > , labels, stream,< / div >
< div class = "line" > < a name = "l00217" > < / a > < span class = "lineno" > 217< / span >   {(int) n, (< span class = "keywordtype" > int< / span > ) k});< / div >
< div class = "line" > < a name = "l00218" > < / a > < span class = "lineno" > 218< / span >   < / div >
< div class = "line" > < a name = "l00219" > < / a > < span class = "lineno" > 219< / span >   < span class = "keywordtype" > bool< / span > usePaged = < span class = "keyword" > false< / span > ;< / div >
< div class = "line" > < a name = "l00220" > < / a > < span class = "lineno" > 220< / span >   < / div >
< div class = "line" > < a name = "l00221" > < / a > < span class = "lineno" > 221< / span >   < span class = "keywordflow" > if< / span > (getDeviceForAddress(x) == -1) {< / div >
< div class = "line" > < a name = "l00222" > < / a > < span class = "lineno" > 222< / span >   < span class = "comment" > // It is possible that the user is querying for a vector set size< / span > < / div >
< div class = "line" > < a name = "l00223" > < / a > < span class = "lineno" > 223< / span >   < span class = "comment" > // `x` that won't fit on the GPU.< / span > < / div >
< div class = "line" > < a name = "l00224" > < / a > < span class = "lineno" > 224< / span >   < span class = "comment" > // In this case, we will have to handle paging of the data from CPU< / span > < / div >
< div class = "line" > < a name = "l00225" > < / a > < span class = "lineno" > 225< / span >   < span class = "comment" > // -> GPU.< / span > < / div >
< div class = "line" > < a name = "l00226" > < / a > < span class = "lineno" > 226< / span >   < span class = "comment" > // Currently, we don't handle the case where the output data won't< / span > < / div >
< div class = "line" > < a name = "l00227" > < / a > < span class = "lineno" > 227< / span >   < span class = "comment" > // fit on the GPU (e.g., n * k is too large for the GPU memory).< / span > < / div >
< div class = "line" > < a name = "l00228" > < / a > < span class = "lineno" > 228< / span >   < span class = "keywordtype" > size_t< / span > dataSize = (size_t) n * this-> < a class = "code" href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > d< / a > * < span class = "keyword" > sizeof< / span > (< span class = "keywordtype" > float< / span > );< / div >
< div class = "line" > < a name = "l00229" > < / a > < span class = "lineno" > 229< / span >   < / div >
< div class = "line" > < a name = "l00230" > < / a > < span class = "lineno" > 230< / span >   < span class = "keywordflow" > if< / span > (dataSize > = < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a32a08664fc4dca2f9405e07ea5bc206f" > minPagedSize_< / a > ) {< / div >
< div class = "line" > < a name = "l00231" > < / a > < span class = "lineno" > 231< / span >   searchFromCpuPaged_(n, x, k,< / div >
< div class = "line" > < a name = "l00232" > < / a > < span class = "lineno" > 232< / span >   outDistances.data(),< / div >
< div class = "line" > < a name = "l00233" > < / a > < span class = "lineno" > 233< / span >   outLabels.data());< / div >
< div class = "line" > < a name = "l00234" > < / a > < span class = "lineno" > 234< / span >   usePaged = < span class = "keyword" > true< / span > ;< / div >
< div class = "line" > < a name = "l00235" > < / a > < span class = "lineno" > 235< / span >   }< / div >
< div class = "line" > < a name = "l00236" > < / a > < span class = "lineno" > 236< / span >   }< / div >
< div class = "line" > < a name = "l00237" > < / a > < span class = "lineno" > 237< / span >   < / div >
< div class = "line" > < a name = "l00238" > < / a > < span class = "lineno" > 238< / span >   < span class = "keywordflow" > if< / span > (!usePaged) {< / div >
< div class = "line" > < a name = "l00239" > < / a > < span class = "lineno" > 239< / span >   searchNonPaged_(n, x, k,< / div >
< div class = "line" > < a name = "l00240" > < / a > < span class = "lineno" > 240< / span >   outDistances.data(),< / div >
< div class = "line" > < a name = "l00241" > < / a > < span class = "lineno" > 241< / span >   outLabels.data());< / div >
< div class = "line" > < a name = "l00242" > < / a > < span class = "lineno" > 242< / span >   }< / div >
< div class = "line" > < a name = "l00243" > < / a > < span class = "lineno" > 243< / span >   < / div >
< div class = "line" > < a name = "l00244" > < / a > < span class = "lineno" > 244< / span >   < span class = "comment" > // Copy back if necessary< / span > < / div >
< div class = "line" > < a name = "l00245" > < / a > < span class = "lineno" > 245< / span >   fromDevice< float, 2> (outDistances, distances, stream);< / div >
< div class = "line" > < a name = "l00246" > < / a > < span class = "lineno" > 246< / span >   fromDevice< faiss::Index::idx_t, 2> (outLabels, labels, stream);< / div >
< div class = "line" > < a name = "l00247" > < / a > < span class = "lineno" > 247< / span >   }< / div >
< div class = "line" > < a name = "l00248" > < / a > < span class = "lineno" > 248< / span >   < / div >
< div class = "line" > < a name = "l00249" > < / a > < span class = "lineno" > 249< / span >   < span class = "keywordtype" > void< / span > < / div >
< div class = "line" > < a name = "l00250" > < / a > < span class = "lineno" > 250< / span >   GpuIndex::searchNonPaged_(< span class = "keywordtype" > int< / span > n,< / div >
< div class = "line" > < a name = "l00251" > < / a > < span class = "lineno" > 251< / span >   < span class = "keyword" > const< / span > < span class = "keywordtype" > float< / span > * x,< / div >
< div class = "line" > < a name = "l00252" > < / a > < span class = "lineno" > 252< / span >   < span class = "keywordtype" > int< / span > k,< / div >
< div class = "line" > < a name = "l00253" > < / a > < span class = "lineno" > 253< / span >   < span class = "keywordtype" > float< / span > * outDistancesData,< / div >
< div class = "line" > < a name = "l00254" > < / a > < span class = "lineno" > 254< / span >   < a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > * outIndicesData)< span class = "keyword" > const < / span > {< / div >
< div class = "line" > < a name = "l00255" > < / a > < span class = "lineno" > 255< / span >   < span class = "keyword" > auto< / span > stream = resources_-> getDefaultStream(device_);< / div >
< div class = "line" > < a name = "l00256" > < / a > < span class = "lineno" > 256< / span >   < / div >
< div class = "line" > < a name = "l00257" > < / a > < span class = "lineno" > 257< / span >   < span class = "comment" > // Make sure arguments are on the device we desire; use temporary< / span > < / div >
< div class = "line" > < a name = "l00258" > < / a > < span class = "lineno" > 258< / span >   < span class = "comment" > // memory allocations to move it if necessary< / span > < / div >
< div class = "line" > < a name = "l00259" > < / a > < span class = "lineno" > 259< / span >   < span class = "keyword" > auto< / span > vecs = toDevice< float, 2> (< a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a17b82a8a11783da6eb1b07c9aab98c36" > resources_< / a > ,< / div >
< div class = "line" > < a name = "l00260" > < / a > < span class = "lineno" > 260< / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a67750633faa35677ee505a1e61cfe142" > device_< / a > ,< / div >
< div class = "line" > < a name = "l00261" > < / a > < span class = "lineno" > 261< / span >   < span class = "keyword" > const_cast< < / span > < span class = "keywordtype" > float< / span > *< span class = "keyword" > > < / span > (x),< / div >
< div class = "line" > < a name = "l00262" > < / a > < span class = "lineno" > 262< / span >   stream,< / div >
< div class = "line" > < a name = "l00263" > < / a > < span class = "lineno" > 263< / span >   {n, (int) this-> < a class = "code" href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > d< / a > });< / div >
< div class = "line" > < a name = "l00264" > < / a > < span class = "lineno" > 264< / span >   < / div >
< div class = "line" > < a name = "l00265" > < / a > < span class = "lineno" > 265< / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a184c443785b715fd692b2b67aa71d687" > searchImpl_< / a > (n, vecs.data(), k, outDistancesData, outIndicesData);< / div >
< div class = "line" > < a name = "l00266" > < / a > < span class = "lineno" > 266< / span >   }< / div >
< div class = "line" > < a name = "l00267" > < / a > < span class = "lineno" > 267< / span >   < / div >
< div class = "line" > < a name = "l00268" > < / a > < span class = "lineno" > 268< / span >   < span class = "keywordtype" > void< / span > < / div >
< div class = "line" > < a name = "l00269" > < / a > < span class = "lineno" > 269< / span >   GpuIndex::searchFromCpuPaged_(< span class = "keywordtype" > int< / span > n,< / div >
< div class = "line" > < a name = "l00270" > < / a > < span class = "lineno" > 270< / span >   < span class = "keyword" > const< / span > < span class = "keywordtype" > float< / span > * x,< / div >
< div class = "line" > < a name = "l00271" > < / a > < span class = "lineno" > 271< / span >   < span class = "keywordtype" > int< / span > k,< / div >
< div class = "line" > < a name = "l00272" > < / a > < span class = "lineno" > 272< / span >   < span class = "keywordtype" > float< / span > * outDistancesData,< / div >
< div class = "line" > < a name = "l00273" > < / a > < span class = "lineno" > 273< / span >   < a class = "code" href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > Index::idx_t< / a > * outIndicesData)< span class = "keyword" > const < / span > {< / div >
< div class = "line" > < a name = "l00274" > < / a > < span class = "lineno" > 274< / span >   Tensor< float, 2, true> outDistances(outDistancesData, {n, k});< / div >
< div class = "line" > < a name = "l00275" > < / a > < span class = "lineno" > 275< / span >   Tensor< Index::idx_t, 2, true> outIndices(outIndicesData, {n, k});< / div >
< div class = "line" > < a name = "l00276" > < / a > < span class = "lineno" > 276< / span >   < / div >
< div class = "line" > < a name = "l00277" > < / a > < span class = "lineno" > 277< / span >   < span class = "comment" > // Is pinned memory available?< / span > < / div >
< div class = "line" > < a name = "l00278" > < / a > < span class = "lineno" > 278< / span >   < span class = "keyword" > auto< / span > pinnedAlloc = resources_-> getPinnedMemory();< / div >
< div class = "line" > < a name = "l00279" > < / a > < span class = "lineno" > 279< / span >   < span class = "keywordtype" > int< / span > pageSizeInVecs =< / div >
< div class = "line" > < a name = "l00280" > < / a > < span class = "lineno" > 280< / span >   (int) ((pinnedAlloc.second / 2) / (< span class = "keyword" > sizeof< / span > (float) * this-> < a class = "code" href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > d< / a > ));< / div >
< div class = "line" > < a name = "l00281" > < / a > < span class = "lineno" > 281< / span >   < / div >
< div class = "line" > < a name = "l00282" > < / a > < span class = "lineno" > 282< / span >   < span class = "keywordflow" > if< / span > (!pinnedAlloc.first || pageSizeInVecs < 1) {< / div >
< div class = "line" > < a name = "l00283" > < / a > < span class = "lineno" > 283< / span >   < span class = "comment" > // Just page without overlapping copy with compute< / span > < / div >
< div class = "line" > < a name = "l00284" > < / a > < span class = "lineno" > 284< / span >   < span class = "keywordtype" > int< / span > batchSize = utils::nextHighestPowerOf2(< / div >
< div class = "line" > < a name = "l00285" > < / a > < span class = "lineno" > 285< / span >   (< span class = "keywordtype" > int< / span > ) ((< span class = "keywordtype" > size_t< / span > ) kNonPinnedPageSize /< / div >
< div class = "line" > < a name = "l00286" > < / a > < span class = "lineno" > 286< / span >   (< span class = "keyword" > sizeof< / span > (< span class = "keywordtype" > float< / span > ) * this-> < a class = "code" href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > d< / a > )));< / div >
< div class = "line" > < a name = "l00287" > < / a > < span class = "lineno" > 287< / span >   < / div >
< div class = "line" > < a name = "l00288" > < / a > < span class = "lineno" > 288< / span >   < span class = "keywordflow" > for< / span > (< span class = "keywordtype" > int< / span > cur = 0; cur < n; cur += batchSize) {< / div >
< div class = "line" > < a name = "l00289" > < / a > < span class = "lineno" > 289< / span >   < span class = "keywordtype" > int< / span > num = std::min(batchSize, n - cur);< / div >
< div class = "line" > < a name = "l00290" > < / a > < span class = "lineno" > 290< / span >   < / div >
< div class = "line" > < a name = "l00291" > < / a > < span class = "lineno" > 291< / span >   < span class = "keyword" > auto< / span > outDistancesSlice = outDistances.narrowOutermost(cur, num);< / div >
< div class = "line" > < a name = "l00292" > < / a > < span class = "lineno" > 292< / span >   < span class = "keyword" > auto< / span > outIndicesSlice = outIndices.narrowOutermost(cur, num);< / div >
< div class = "line" > < a name = "l00293" > < / a > < span class = "lineno" > 293< / span >   < / div >
< div class = "line" > < a name = "l00294" > < / a > < span class = "lineno" > 294< / span >   searchNonPaged_(num,< / div >
< div class = "line" > < a name = "l00295" > < / a > < span class = "lineno" > 295< / span >   x + (< span class = "keywordtype" > size_t< / span > ) cur * this-> < a class = "code" href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > d< / a > ,< / div >
< div class = "line" > < a name = "l00296" > < / a > < span class = "lineno" > 296< / span >   k,< / div >
< div class = "line" > < a name = "l00297" > < / a > < span class = "lineno" > 297< / span >   outDistancesSlice.data(),< / div >
< div class = "line" > < a name = "l00298" > < / a > < span class = "lineno" > 298< / span >   outIndicesSlice.data());< / div >
< div class = "line" > < a name = "l00299" > < / a > < span class = "lineno" > 299< / span >   }< / div >
< div class = "line" > < a name = "l00300" > < / a > < span class = "lineno" > 300< / span >   < / div >
< div class = "line" > < a name = "l00301" > < / a > < span class = "lineno" > 301< / span >   < span class = "keywordflow" > return< / span > ;< / div >
< div class = "line" > < a name = "l00302" > < / a > < span class = "lineno" > 302< / span >   }< / div >
< div class = "line" > < a name = "l00303" > < / a > < span class = "lineno" > 303< / span >   < / div >
< div class = "line" > < a name = "l00304" > < / a > < span class = "lineno" > 304< / span >   < span class = "comment" > //< / span > < / div >
< div class = "line" > < a name = "l00305" > < / a > < span class = "lineno" > 305< / span >   < span class = "comment" > // Pinned memory is available, so we can overlap copy with compute.< / span > < / div >
< div class = "line" > < a name = "l00306" > < / a > < span class = "lineno" > 306< / span >   < span class = "comment" > // We use two pinned memory buffers, and triple-buffer the< / span > < / div >
< div class = "line" > < a name = "l00307" > < / a > < span class = "lineno" > 307< / span >   < span class = "comment" > // procedure:< / span > < / div >
< div class = "line" > < a name = "l00308" > < / a > < span class = "lineno" > 308< / span >   < span class = "comment" > //< / span > < / div >
< div class = "line" > < a name = "l00309" > < / a > < span class = "lineno" > 309< / span >   < span class = "comment" > // 1 CPU copy -> pinned< / span > < / div >
< div class = "line" > < a name = "l00310" > < / a > < span class = "lineno" > 310< / span >   < span class = "comment" > // 2 pinned copy -> GPU< / span > < / div >
< div class = "line" > < a name = "l00311" > < / a > < span class = "lineno" > 311< / span >   < span class = "comment" > // 3 GPU compute< / span > < / div >
< div class = "line" > < a name = "l00312" > < / a > < span class = "lineno" > 312< / span >   < span class = "comment" > //< / span > < / div >
< div class = "line" > < a name = "l00313" > < / a > < span class = "lineno" > 313< / span >   < span class = "comment" > // 1 2 3 1 2 3 ... (pinned buf A)< / span > < / div >
< div class = "line" > < a name = "l00314" > < / a > < span class = "lineno" > 314< / span >   < span class = "comment" > // 1 2 3 1 2 ... (pinned buf B)< / span > < / div >
< div class = "line" > < a name = "l00315" > < / a > < span class = "lineno" > 315< / span >   < span class = "comment" > // 1 2 3 1 ... (pinned buf A)< / span > < / div >
< div class = "line" > < a name = "l00316" > < / a > < span class = "lineno" > 316< / span >   < span class = "comment" > // time -> < / span > < / div >
< div class = "line" > < a name = "l00317" > < / a > < span class = "lineno" > 317< / span >   < span class = "comment" > //< / span > < / div >
< div class = "line" > < a name = "l00318" > < / a > < span class = "lineno" > 318< / span >   < span class = "keyword" > auto< / span > defaultStream = resources_-> getDefaultStream(device_);< / div >
< div class = "line" > < a name = "l00319" > < / a > < span class = "lineno" > 319< / span >   < span class = "keyword" > auto< / span > copyStream = resources_-> getAsyncCopyStream(device_);< / div >
< div class = "line" > < a name = "l00320" > < / a > < span class = "lineno" > 320< / span >   < / div >
< div class = "line" > < a name = "l00321" > < / a > < span class = "lineno" > 321< / span >   FAISS_ASSERT((< span class = "keywordtype" > size_t< / span > ) pageSizeInVecs * this-> < a class = "code" href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > d< / a > < =< / div >
< div class = "line" > < a name = "l00322" > < / a > < span class = "lineno" > 322< / span >   (< span class = "keywordtype" > size_t< / span > ) std::numeric_limits< int> ::max());< / div >
< div class = "line" > < a name = "l00323" > < / a > < span class = "lineno" > 323< / span >   < / div >
< div class = "line" > < a name = "l00324" > < / a > < span class = "lineno" > 324< / span >   < span class = "keywordtype" > float< / span > * bufPinnedA = (< span class = "keywordtype" > float< / span > *) pinnedAlloc.first;< / div >
< div class = "line" > < a name = "l00325" > < / a > < span class = "lineno" > 325< / span >   < span class = "keywordtype" > float< / span > * bufPinnedB = bufPinnedA + (< span class = "keywordtype" > size_t< / span > ) pageSizeInVecs * this-> < a class = "code" href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > d< / a > ;< / div >
< div class = "line" > < a name = "l00326" > < / a > < span class = "lineno" > 326< / span >   < span class = "keywordtype" > float< / span > * bufPinned[2] = {bufPinnedA, bufPinnedB};< / div >
< div class = "line" > < a name = "l00327" > < / a > < span class = "lineno" > 327< / span >   < / div >
< div class = "line" > < a name = "l00328" > < / a > < span class = "lineno" > 328< / span >   < span class = "comment" > // Reserve space on the GPU for the destination of the pinned buffer< / span > < / div >
< div class = "line" > < a name = "l00329" > < / a > < span class = "lineno" > 329< / span >   < span class = "comment" > // copy< / span > < / div >
< div class = "line" > < a name = "l00330" > < / a > < span class = "lineno" > 330< / span >   DeviceTensor< float, 2, true> bufGpuA(< / div >
< div class = "line" > < a name = "l00331" > < / a > < span class = "lineno" > 331< / span >   resources_-> getMemoryManagerCurrentDevice(),< / div >
< div class = "line" > < a name = "l00332" > < / a > < span class = "lineno" > 332< / span >   {(int) pageSizeInVecs, (< span class = "keywordtype" > int< / span > ) this-> d},< / div >
< div class = "line" > < a name = "l00333" > < / a > < span class = "lineno" > 333< / span >   defaultStream);< / div >
< div class = "line" > < a name = "l00334" > < / a > < span class = "lineno" > 334< / span >   DeviceTensor< float, 2, true> bufGpuB(< / div >
< div class = "line" > < a name = "l00335" > < / a > < span class = "lineno" > 335< / span >   resources_-> getMemoryManagerCurrentDevice(),< / div >
< div class = "line" > < a name = "l00336" > < / a > < span class = "lineno" > 336< / span >   {(int) pageSizeInVecs, (< span class = "keywordtype" > int< / span > ) this-> d},< / div >
< div class = "line" > < a name = "l00337" > < / a > < span class = "lineno" > 337< / span >   defaultStream);< / div >
< div class = "line" > < a name = "l00338" > < / a > < span class = "lineno" > 338< / span >   DeviceTensor< float, 2, true> * bufGpus[2] = {& bufGpuA, & bufGpuB};< / div >
< div class = "line" > < a name = "l00339" > < / a > < span class = "lineno" > 339< / span >   < / div >
< div class = "line" > < a name = "l00340" > < / a > < span class = "lineno" > 340< / span >   < span class = "comment" > // Copy completion events for the pinned buffers< / span > < / div >
< div class = "line" > < a name = "l00341" > < / a > < span class = "lineno" > 341< / span >   std::unique_ptr< CudaEvent> eventPinnedCopyDone[2];< / div >
< div class = "line" > < a name = "l00342" > < / a > < span class = "lineno" > 342< / span >   < / div >
< div class = "line" > < a name = "l00343" > < / a > < span class = "lineno" > 343< / span >   < span class = "comment" > // Execute completion events for the GPU buffers< / span > < / div >
< div class = "line" > < a name = "l00344" > < / a > < span class = "lineno" > 344< / span >   std::unique_ptr< CudaEvent> eventGpuExecuteDone[2];< / div >
< div class = "line" > < a name = "l00345" > < / a > < span class = "lineno" > 345< / span >   < / div >
< div class = "line" > < a name = "l00346" > < / a > < span class = "lineno" > 346< / span >   < span class = "comment" > // All offsets are in terms of number of vectors; they remain within< / span > < / div >
< div class = "line" > < a name = "l00347" > < / a > < span class = "lineno" > 347< / span >   < span class = "comment" > // int bounds (as this function only handles up to max int vectors)< / span > < / div >
< div class = "line" > < a name = "l00348" > < / a > < span class = "lineno" > 348< / span >   < / div >
< div class = "line" > < a name = "l00349" > < / a > < span class = "lineno" > 349< / span >   < span class = "comment" > // Current start offset for buffer 1< / span > < / div >
< div class = "line" > < a name = "l00350" > < / a > < span class = "lineno" > 350< / span >   < span class = "keywordtype" > int< / span > cur1 = 0;< / div >
< div class = "line" > < a name = "l00351" > < / a > < span class = "lineno" > 351< / span >   < span class = "keywordtype" > int< / span > cur1BufIndex = 0;< / div >
< div class = "line" > < a name = "l00352" > < / a > < span class = "lineno" > 352< / span >   < / div >
< div class = "line" > < a name = "l00353" > < / a > < span class = "lineno" > 353< / span >   < span class = "comment" > // Current start offset for buffer 2< / span > < / div >
< div class = "line" > < a name = "l00354" > < / a > < span class = "lineno" > 354< / span >   < span class = "keywordtype" > int< / span > cur2 = -1;< / div >
< div class = "line" > < a name = "l00355" > < / a > < span class = "lineno" > 355< / span >   < span class = "keywordtype" > int< / span > cur2BufIndex = 0;< / div >
< div class = "line" > < a name = "l00356" > < / a > < span class = "lineno" > 356< / span >   < / div >
< div class = "line" > < a name = "l00357" > < / a > < span class = "lineno" > 357< / span >   < span class = "comment" > // Current start offset for buffer 3< / span > < / div >
< div class = "line" > < a name = "l00358" > < / a > < span class = "lineno" > 358< / span >   < span class = "keywordtype" > int< / span > cur3 = -1;< / div >
< div class = "line" > < a name = "l00359" > < / a > < span class = "lineno" > 359< / span >   < span class = "keywordtype" > int< / span > cur3BufIndex = 0;< / div >
< div class = "line" > < a name = "l00360" > < / a > < span class = "lineno" > 360< / span >   < / div >
< div class = "line" > < a name = "l00361" > < / a > < span class = "lineno" > 361< / span >   < span class = "keywordflow" > while< / span > (cur3 < n) {< / div >
< div class = "line" > < a name = "l00362" > < / a > < span class = "lineno" > 362< / span >   < span class = "comment" > // Start async pinned -> GPU copy first (buf 2)< / span > < / div >
< div class = "line" > < a name = "l00363" > < / a > < span class = "lineno" > 363< / span >   < span class = "keywordflow" > if< / span > (cur2 != -1 & & cur2 < n) {< / div >
< div class = "line" > < a name = "l00364" > < / a > < span class = "lineno" > 364< / span >   < span class = "comment" > // Copy pinned to GPU< / span > < / div >
< div class = "line" > < a name = "l00365" > < / a > < span class = "lineno" > 365< / span >   < span class = "keywordtype" > int< / span > numToCopy = std::min(pageSizeInVecs, n - cur2);< / div >
< div class = "line" > < a name = "l00366" > < / a > < span class = "lineno" > 366< / span >   < / div >
< div class = "line" > < a name = "l00367" > < / a > < span class = "lineno" > 367< / span >   < span class = "comment" > // Make sure any previous execution has completed before continuing< / span > < / div >
< div class = "line" > < a name = "l00368" > < / a > < span class = "lineno" > 368< / span >   < span class = "keyword" > auto< / span > & eventPrev = eventGpuExecuteDone[cur2BufIndex];< / div >
< div class = "line" > < a name = "l00369" > < / a > < span class = "lineno" > 369< / span >   < span class = "keywordflow" > if< / span > (eventPrev.get()) {< / div >
< div class = "line" > < a name = "l00370" > < / a > < span class = "lineno" > 370< / span >   eventPrev-> streamWaitOnEvent(copyStream);< / div >
< div class = "line" > < a name = "l00371" > < / a > < span class = "lineno" > 371< / span >   }< / div >
< div class = "line" > < a name = "l00372" > < / a > < span class = "lineno" > 372< / span >   < / div >
< div class = "line" > < a name = "l00373" > < / a > < span class = "lineno" > 373< / span >   CUDA_VERIFY(cudaMemcpyAsync(bufGpus[cur2BufIndex]-> data(),< / div >
< div class = "line" > < a name = "l00374" > < / a > < span class = "lineno" > 374< / span >   bufPinned[cur2BufIndex],< / div >
< div class = "line" > < a name = "l00375" > < / a > < span class = "lineno" > 375< / span >   (< span class = "keywordtype" > size_t< / span > ) numToCopy * this-> d * < span class = "keyword" > sizeof< / span > (< span class = "keywordtype" > float< / span > ),< / div >
< div class = "line" > < a name = "l00376" > < / a > < span class = "lineno" > 376< / span >   cudaMemcpyHostToDevice,< / div >
< div class = "line" > < a name = "l00377" > < / a > < span class = "lineno" > 377< / span >   copyStream));< / div >
< div class = "line" > < a name = "l00378" > < / a > < span class = "lineno" > 378< / span >   < / div >
< div class = "line" > < a name = "l00379" > < / a > < span class = "lineno" > 379< / span >   < span class = "comment" > // Mark a completion event in this stream< / span > < / div >
< div class = "line" > < a name = "l00380" > < / a > < span class = "lineno" > 380< / span >   eventPinnedCopyDone[cur2BufIndex] =< / div >
< div class = "line" > < a name = "l00381" > < / a > < span class = "lineno" > 381< / span >   std::move(std::unique_ptr< CudaEvent> (< span class = "keyword" > new< / span > CudaEvent(copyStream)));< / div >
< div class = "line" > < a name = "l00382" > < / a > < span class = "lineno" > 382< / span >   < / div >
< div class = "line" > < a name = "l00383" > < / a > < span class = "lineno" > 383< / span >   < span class = "comment" > // We pick up from here< / span > < / div >
< div class = "line" > < a name = "l00384" > < / a > < span class = "lineno" > 384< / span >   cur3 = cur2;< / div >
< div class = "line" > < a name = "l00385" > < / a > < span class = "lineno" > 385< / span >   cur2 += numToCopy;< / div >
< div class = "line" > < a name = "l00386" > < / a > < span class = "lineno" > 386< / span >   cur2BufIndex = (cur2BufIndex == 0) ? 1 : 0;< / div >
< div class = "line" > < a name = "l00387" > < / a > < span class = "lineno" > 387< / span >   }< / div >
< div class = "line" > < a name = "l00388" > < / a > < span class = "lineno" > 388< / span >   < / div >
< div class = "line" > < a name = "l00389" > < / a > < span class = "lineno" > 389< / span >   < span class = "keywordflow" > if< / span > (cur3 != -1 & & cur3 < n) {< / div >
< div class = "line" > < a name = "l00390" > < / a > < span class = "lineno" > 390< / span >   < span class = "comment" > // Process on GPU< / span > < / div >
< div class = "line" > < a name = "l00391" > < / a > < span class = "lineno" > 391< / span >   < span class = "keywordtype" > int< / span > numToProcess = std::min(pageSizeInVecs, n - cur3);< / div >
< div class = "line" > < a name = "l00392" > < / a > < span class = "lineno" > 392< / span >   < / div >
< div class = "line" > < a name = "l00393" > < / a > < span class = "lineno" > 393< / span >   < span class = "comment" > // Make sure the previous copy has completed before continuing< / span > < / div >
< div class = "line" > < a name = "l00394" > < / a > < span class = "lineno" > 394< / span >   < span class = "keyword" > auto< / span > & eventPrev = eventPinnedCopyDone[cur3BufIndex];< / div >
< div class = "line" > < a name = "l00395" > < / a > < span class = "lineno" > 395< / span >   FAISS_ASSERT(eventPrev.get());< / div >
< div class = "line" > < a name = "l00396" > < / a > < span class = "lineno" > 396< / span >   < / div >
< div class = "line" > < a name = "l00397" > < / a > < span class = "lineno" > 397< / span >   eventPrev-> streamWaitOnEvent(defaultStream);< / div >
< div class = "line" > < a name = "l00398" > < / a > < span class = "lineno" > 398< / span >   < / div >
< div class = "line" > < a name = "l00399" > < / a > < span class = "lineno" > 399< / span >   < span class = "comment" > // Create tensor wrappers< / span > < / div >
< div class = "line" > < a name = "l00400" > < / a > < span class = "lineno" > 400< / span >   < span class = "comment" > // DeviceTensor< float, 2, true> input(bufGpus[cur3BufIndex]-> data(),< / span > < / div >
< div class = "line" > < a name = "l00401" > < / a > < span class = "lineno" > 401< / span >   < span class = "comment" > // {numToProcess, this-> d});< / span > < / div >
< div class = "line" > < a name = "l00402" > < / a > < span class = "lineno" > 402< / span >   < span class = "keyword" > auto< / span > outDistancesSlice = outDistances.narrowOutermost(cur3, numToProcess);< / div >
< div class = "line" > < a name = "l00403" > < / a > < span class = "lineno" > 403< / span >   < span class = "keyword" > auto< / span > outIndicesSlice = outIndices.narrowOutermost(cur3, numToProcess);< / div >
< div class = "line" > < a name = "l00404" > < / a > < span class = "lineno" > 404< / span >   < / div >
< div class = "line" > < a name = "l00405" > < / a > < span class = "lineno" > 405< / span >   < a class = "code" href = "classfaiss_1_1gpu_1_1GpuIndex.html#a184c443785b715fd692b2b67aa71d687" > searchImpl_< / a > (numToProcess,< / div >
< div class = "line" > < a name = "l00406" > < / a > < span class = "lineno" > 406< / span >   bufGpus[cur3BufIndex]-> data(),< / div >
< div class = "line" > < a name = "l00407" > < / a > < span class = "lineno" > 407< / span >   k,< / div >
< div class = "line" > < a name = "l00408" > < / a > < span class = "lineno" > 408< / span >   outDistancesSlice.data(),< / div >
< div class = "line" > < a name = "l00409" > < / a > < span class = "lineno" > 409< / span >   outIndicesSlice.data());< / div >
< div class = "line" > < a name = "l00410" > < / a > < span class = "lineno" > 410< / span >   < / div >
< div class = "line" > < a name = "l00411" > < / a > < span class = "lineno" > 411< / span >   < span class = "comment" > // Create completion event< / span > < / div >
< div class = "line" > < a name = "l00412" > < / a > < span class = "lineno" > 412< / span >   eventGpuExecuteDone[cur3BufIndex] =< / div >
< div class = "line" > < a name = "l00413" > < / a > < span class = "lineno" > 413< / span >   std::move(std::unique_ptr< CudaEvent> (< span class = "keyword" > new< / span > CudaEvent(defaultStream)));< / div >
< div class = "line" > < a name = "l00414" > < / a > < span class = "lineno" > 414< / span >   < / div >
< div class = "line" > < a name = "l00415" > < / a > < span class = "lineno" > 415< / span >   < span class = "comment" > // We pick up from here< / span > < / div >
< div class = "line" > < a name = "l00416" > < / a > < span class = "lineno" > 416< / span >   cur3BufIndex = (cur3BufIndex == 0) ? 1 : 0;< / div >
< div class = "line" > < a name = "l00417" > < / a > < span class = "lineno" > 417< / span >   cur3 += numToProcess;< / div >
< div class = "line" > < a name = "l00418" > < / a > < span class = "lineno" > 418< / span >   }< / div >
< div class = "line" > < a name = "l00419" > < / a > < span class = "lineno" > 419< / span >   < / div >
< div class = "line" > < a name = "l00420" > < / a > < span class = "lineno" > 420< / span >   < span class = "keywordflow" > if< / span > (cur1 < n) {< / div >
< div class = "line" > < a name = "l00421" > < / a > < span class = "lineno" > 421< / span >   < span class = "comment" > // Copy CPU mem to CPU pinned< / span > < / div >
< div class = "line" > < a name = "l00422" > < / a > < span class = "lineno" > 422< / span >   < span class = "keywordtype" > int< / span > numToCopy = std::min(pageSizeInVecs, n - cur1);< / div >
< div class = "line" > < a name = "l00423" > < / a > < span class = "lineno" > 423< / span >   < / div >
< div class = "line" > < a name = "l00424" > < / a > < span class = "lineno" > 424< / span >   < span class = "comment" > // Make sure any previous copy has completed before continuing< / span > < / div >
< div class = "line" > < a name = "l00425" > < / a > < span class = "lineno" > 425< / span >   < span class = "keyword" > auto< / span > & eventPrev = eventPinnedCopyDone[cur1BufIndex];< / div >
< div class = "line" > < a name = "l00426" > < / a > < span class = "lineno" > 426< / span >   < span class = "keywordflow" > if< / span > (eventPrev.get()) {< / div >
< div class = "line" > < a name = "l00427" > < / a > < span class = "lineno" > 427< / span >   eventPrev-> cpuWaitOnEvent();< / div >
< div class = "line" > < a name = "l00428" > < / a > < span class = "lineno" > 428< / span >   }< / div >
< div class = "line" > < a name = "l00429" > < / a > < span class = "lineno" > 429< / span >   < / div >
< div class = "line" > < a name = "l00430" > < / a > < span class = "lineno" > 430< / span >   memcpy(bufPinned[cur1BufIndex],< / div >
< div class = "line" > < a name = "l00431" > < / a > < span class = "lineno" > 431< / span >   x + (< span class = "keywordtype" > size_t< / span > ) cur1 * this-> d,< / div >
< div class = "line" > < a name = "l00432" > < / a > < span class = "lineno" > 432< / span >   (< span class = "keywordtype" > size_t< / span > ) numToCopy * this-> d * < span class = "keyword" > sizeof< / span > (< span class = "keywordtype" > float< / span > ));< / div >
< div class = "line" > < a name = "l00433" > < / a > < span class = "lineno" > 433< / span >   < / div >
< div class = "line" > < a name = "l00434" > < / a > < span class = "lineno" > 434< / span >   < span class = "comment" > // We pick up from here< / span > < / div >
< div class = "line" > < a name = "l00435" > < / a > < span class = "lineno" > 435< / span >   cur2 = cur1;< / div >
< div class = "line" > < a name = "l00436" > < / a > < span class = "lineno" > 436< / span >   cur1 += numToCopy;< / div >
< div class = "line" > < a name = "l00437" > < / a > < span class = "lineno" > 437< / span >   cur1BufIndex = (cur1BufIndex == 0) ? 1 : 0;< / div >
< div class = "line" > < a name = "l00438" > < / a > < span class = "lineno" > 438< / span >   }< / div >
< div class = "line" > < a name = "l00439" > < / a > < span class = "lineno" > 439< / span >   }< / div >
< div class = "line" > < a name = "l00440" > < / a > < span class = "lineno" > 440< / span >   }< / div >
< div class = "line" > < a name = "l00441" > < / a > < span class = "lineno" > 441< / span >   < / div >
< div class = "line" > < a name = "l00442" > < / a > < span class = "lineno" > 442< / span >   } } < span class = "comment" > // namespace< / span > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuResources_html_aa0354aa570c24e17a9f8a6a45b153ed2" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuResources.html#aa0354aa570c24e17a9f8a6a45b153ed2" > faiss::gpu::GpuResources::getDefaultStreamCurrentDevice< / a > < / div > < div class = "ttdeci" > cudaStream_t getDefaultStreamCurrentDevice()< / div > < div class = "ttdoc" > Calls getDefaultStream with the current device. < / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "GpuResources_8cpp_source.html#l00023" > GpuResources.cpp:23< / a > < / div > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuIndex_html_adbdc96814ff2d4390dfd860bd5918203" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuIndex.html#adbdc96814ff2d4390dfd860bd5918203" > faiss::gpu::GpuIndex::getMinPagingSize< / a > < / div > < div class = "ttdeci" > size_t getMinPagingSize() const < / div > < div class = "ttdoc" > Returns the current minimum data size for paged searches. < / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "GpuIndex_8cu_source.html#l00074" > GpuIndex.cu:74< / a > < / div > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuIndex_html_a184c443785b715fd692b2b67aa71d687" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuIndex.html#a184c443785b715fd692b2b67aa71d687" > faiss::gpu::GpuIndex::searchImpl_< / a > < / div > < div class = "ttdeci" > virtual void searchImpl_(int n, const float *x, int k, float *distances, Index::idx_t *labels) const =0< / div > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuIndex_html_a358cad8f80a9c4b3aff45f3f7c131d03" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuIndex.html#a358cad8f80a9c4b3aff45f3f7c131d03" > faiss::gpu::GpuIndex::addImplRequiresIDs_< / a > < / div > < div class = "ttdeci" > virtual bool addImplRequiresIDs_() const =0< / div > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuIndex_html_a47f6969fe60d82b8e3407557ba9eec88" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuIndex.html#a47f6969fe60d82b8e3407557ba9eec88" > faiss::gpu::GpuIndex::add_with_ids< / a > < / div > < div class = "ttdeci" > void add_with_ids(Index::idx_t n, const float *x, const Index::idx_t *ids) override< / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "GpuIndex_8cu_source.html#l00085" > GpuIndex.cu:85< / a > < / div > < / div >
2018-12-20 00:48:35 +08:00
< div class = "ttc" id = "structfaiss_1_1Index_html_a2a002388d2c081c2dbab8508dcefe73d" > < div class = "ttname" > < a href = "structfaiss_1_1Index.html#a2a002388d2c081c2dbab8508dcefe73d" > faiss::Index::d< / a > < / div > < div class = "ttdeci" > int d< / div > < div class = "ttdoc" > vector dimension < / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "Index_8h_source.html#l00066" > Index.h:66< / a > < / div > < / div >
2019-05-28 22:17:22 +08:00
< div class = "ttc" id = "structfaiss_1_1Index_html_ad3f0d3071f987baabbdd3da4500c87ea" > < div class = "ttname" > < a href = "structfaiss_1_1Index.html#ad3f0d3071f987baabbdd3da4500c87ea" > faiss::Index::idx_t< / a > < / div > < div class = "ttdeci" > long idx_t< / div > < div class = "ttdoc" > all indices are this type < / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "Index_8h_source.html#l00062" > Index.h:62< / a > < / div > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuIndex_html_a67750633faa35677ee505a1e61cfe142" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuIndex.html#a67750633faa35677ee505a1e61cfe142" > faiss::gpu::GpuIndex::device_< / a > < / div > < div class = "ttdeci" > const int device_< / div > < div class = "ttdoc" > The GPU device we are resident on. < / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "GpuIndex_8h_source.html#l00126" > GpuIndex.h:126< / a > < / div > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuIndex_html_a17b82a8a11783da6eb1b07c9aab98c36" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuIndex.html#a17b82a8a11783da6eb1b07c9aab98c36" > faiss::gpu::GpuIndex::resources_< / a > < / div > < div class = "ttdeci" > GpuResources * resources_< / div > < div class = "ttdoc" > Manages streams, cuBLAS handles and scratch memory for devices. < / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "GpuIndex_8h_source.html#l00123" > GpuIndex.h:123< / a > < / div > < / div >
< div class = "ttc" id = "structfaiss_1_1Index_html_a6970683faa021b7a6f1a0865c0d4eccd" > < div class = "ttname" > < a href = "structfaiss_1_1Index.html#a6970683faa021b7a6f1a0865c0d4eccd" > faiss::Index::ntotal< / a > < / div > < div class = "ttdeci" > idx_t ntotal< / div > < div class = "ttdoc" > total number of indexed vectors < / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "Index_8h_source.html#l00067" > Index.h:67< / a > < / div > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuIndex_html_af576341f6996b0e80e26b9748db51eb7" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuIndex.html#af576341f6996b0e80e26b9748db51eb7" > faiss::gpu::GpuIndex::add< / a > < / div > < div class = "ttdeci" > void add(faiss::Index::idx_t, const float *x) override< / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "GpuIndex_8cu_source.html#l00079" > GpuIndex.cu:79< / a > < / div > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1DeviceScope_html" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1DeviceScope.html" > faiss::gpu::DeviceScope< / a > < / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "DeviceUtils_8h_source.html#l00068" > DeviceUtils.h:68< / a > < / div > < / div >
2018-12-20 00:48:35 +08:00
< div class = "ttc" id = "structfaiss_1_1Index_html_a6e92732617c4dbe364e7678dd8773a7f" > < div class = "ttname" > < a href = "structfaiss_1_1Index.html#a6e92732617c4dbe364e7678dd8773a7f" > faiss::Index::is_trained< / a > < / div > < div class = "ttdeci" > bool is_trained< / div > < div class = "ttdoc" > set if the Index does not require training, or if training is done already < / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "Index_8h_source.html#l00071" > Index.h:71< / a > < / div > < / div >
2019-05-28 22:17:22 +08:00
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuIndex_html_a32a08664fc4dca2f9405e07ea5bc206f" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuIndex.html#a32a08664fc4dca2f9405e07ea5bc206f" > faiss::gpu::GpuIndex::minPagedSize_< / a > < / div > < div class = "ttdeci" > size_t minPagedSize_< / div > < div class = "ttdoc" > Size above which we page copies from the CPU to GPU. < / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "GpuIndex_8h_source.html#l00132" > GpuIndex.h:132< / a > < / div > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuIndex_html_a6c82cbea6b02cc996d634f822c1d310b" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuIndex.html#a6c82cbea6b02cc996d634f822c1d310b" > faiss::gpu::GpuIndex::setMinPagingSize< / a > < / div > < div class = "ttdeci" > void setMinPagingSize(size_t size)< / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "GpuIndex_8cu_source.html#l00069" > GpuIndex.cu:69< / a > < / div > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuIndex_html_ae8479445214c5ef37adf154c138ce973" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuIndex.html#ae8479445214c5ef37adf154c138ce973" > faiss::gpu::GpuIndex::addImpl_< / a > < / div > < div class = "ttdeci" > virtual void addImpl_(int n, const float *x, const Index::idx_t *ids)=0< / div > < / div >
< div class = "ttc" id = "classfaiss_1_1gpu_1_1GpuIndex_html_a4564ff946e4339156173b39449562971" > < div class = "ttname" > < a href = "classfaiss_1_1gpu_1_1GpuIndex.html#a4564ff946e4339156173b39449562971" > faiss::gpu::GpuIndex::search< / a > < / div > < div class = "ttdeci" > void search(Index::idx_t n, const float *x, Index::idx_t k, float *distances, Index::idx_t *labels) const override< / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "GpuIndex_8cu_source.html#l00176" > GpuIndex.cu:176< / a > < / div > < / div >
< div class = "ttc" id = "namespacefaiss_html_afd12191c638da74760ff397cf319752c" > < div class = "ttname" > < a href = "namespacefaiss.html#afd12191c638da74760ff397cf319752c" > faiss::MetricType< / a > < / div > < div class = "ttdeci" > MetricType< / div > < div class = "ttdoc" > Some algorithms support both an inner product version and an L2 search version. < / div > < div class = "ttdef" > < b > Definition:< / b > < a href = "Index_8h_source.html#l00044" > Index.h:44< / a > < / div > < / div >
2017-02-23 06:26:44 +08:00
< / div > <!-- fragment --> < / div > <!-- contents -->
<!-- start footer part -->
< hr class = "footer" / > < address class = "footer" > < small >
Generated by   < a href = "http://www.doxygen.org/index.html" >
< img class = "footer" src = "doxygen.png" alt = "doxygen" / >
< / a > 1.8.5
< / small > < / address >
< / body >
< / html >