blob: 70bb876943af5d63fd4c4a102ff96f6c01249d82 [file] [log] [blame]
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/html;charset=UTF-8"/>
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
<meta name="generator" content="Doxygen 1.8.13"/>
<meta name="viewport" content="width=device-width, initial-scale=1"/>
<title>mxnet: /work/mxnet/3rdparty/mshadow/mshadow/stream_gpu-inl.h File Reference</title>
<link href="tabs.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="jquery.js"></script>
<script type="text/javascript" src="dynsections.js"></script>
<link href="search/search.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="search/searchdata.js"></script>
<script type="text/javascript" src="search/search.js"></script>
<link href="doxygen.css" rel="stylesheet" type="text/css" />
</head>
<body>
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
<div id="titlearea">
<table cellspacing="0" cellpadding="0">
<tbody>
<tr style="height: 56px;">
<td id="projectalign" style="padding-left: 0.5em;">
<div id="projectname">mxnet
</div>
</td>
</tr>
</tbody>
</table>
</div>
<!-- end header part -->
<!-- Generated by Doxygen 1.8.13 -->
<script type="text/javascript">
var searchBox = new SearchBox("searchBox", "search",false,'Search');
</script>
<script type="text/javascript" src="menudata.js"></script>
<script type="text/javascript" src="menu.js"></script>
<script type="text/javascript">
$(function() {
initMenu('',true,false,'search.php','Search');
$(document).ready(function() { init_search(); });
});
</script>
<div id="main-nav"></div>
<!-- window showing the filter options -->
<div id="MSearchSelectWindow"
onmouseover="return searchBox.OnSearchSelectShow()"
onmouseout="return searchBox.OnSearchSelectHide()"
onkeydown="return searchBox.OnSearchSelectKey(event)">
</div>
<!-- iframe showing the search results (closed by default) -->
<div id="MSearchResultsWindow">
<iframe src="javascript:void(0)" frameborder="0"
name="MSearchResults" id="MSearchResults">
</iframe>
</div>
<div id="nav-path" class="navpath">
<ul>
<li class="navelem"><a class="el" href="dir_8cab8f464681f7cc51cee77e79a434cd.html">3rdparty</a></li><li class="navelem"><a class="el" href="dir_3e48ced36faa4eaa1b41f6d960bf0edb.html">mshadow</a></li><li class="navelem"><a class="el" href="dir_00b035bb2ad81894e6ad291054ea5f82.html">mshadow</a></li> </ul>
</div>
</div><!-- top -->
<div class="header">
<div class="summary">
<a href="#nested-classes">Classes</a> &#124;
<a href="#namespaces">Namespaces</a> &#124;
<a href="#func-members">Functions</a> </div>
<div class="headertitle">
<div class="title">stream_gpu-inl.h File Reference</div> </div>
</div><!--header-->
<div class="contents">
<p>implementation of GPU code
<a href="#details">More...</a></p>
<div class="textblock"><code>#include &lt;memory&gt;</code><br />
<code>#include &quot;<a class="el" href="3rdparty_2mshadow_2mshadow_2base_8h_source.html">./base.h</a>&quot;</code><br />
<code>#include &quot;<a class="el" href="tensor_8h_source.html">./tensor.h</a>&quot;</code><br />
<code>#include &quot;./logging.h&quot;</code><br />
</div><div class="textblock"><div class="dynheader">
Include dependency graph for stream_gpu-inl.h:</div>
<div class="dyncontent">
<div class="center"><img src="stream__gpu-inl_8h__incl.png" border="0" usemap="#_2work_2mxnet_23rdparty_2mshadow_2mshadow_2stream__gpu-inl_8h" alt="Include dependency graph for stream_gpu-inl.h"/></div>
<map name="_2work_2mxnet_23rdparty_2mshadow_2mshadow_2stream__gpu-inl_8h" id="_2work_2mxnet_23rdparty_2mshadow_2mshadow_2stream__gpu-inl_8h">
<area shape="rect" id="node3" href="3rdparty_2mshadow_2mshadow_2base_8h.html" title="./base.h" alt="" coords="2735,423,2809,449"/>
<area shape="rect" id="node28" href="tensor_8h.html" title="header file of tensor data structure and functions This lib requires explicit memory allocation and d..." alt="" coords="2653,109,2736,136"/>
<area shape="rect" id="node22" href="half_8h.html" title="definition of half (float16) type. " alt="" coords="3080,497,3147,524"/>
<area shape="rect" id="node24" href="half2_8h.html" title="definition of vector float16, half2 type. " alt="" coords="3171,497,3245,524"/>
<area shape="rect" id="node26" href="bfloat_8h.html" title="definition of bfloat type. " alt="" coords="3270,497,3349,524"/>
<area shape="rect" id="node30" href="expression_8h.html" title="definitions of abstract expressions and expressions template " alt="" coords="2510,348,2623,375"/>
<area shape="rect" id="node31" href="extension_8h.html" title="some extension of expressions, used to support something beyond elementwise op " alt="" coords="1392,184,1499,211"/>
<area shape="rect" id="node32" href="expr__engine-inl_8h.html" title="definitions of how expressions should be evaluated " alt="" coords="158,266,301,293"/>
<area shape="rect" id="node45" href="tensor__cpu-inl_8h.html" title="implementation of CPU host code " alt="" coords="2351,348,2486,375"/>
<area shape="rect" id="node46" href="tensor__gpu-inl_8h.html" title="implementation of GPU host code " alt="" coords="3127,184,3262,211"/>
<area shape="rect" id="node47" href="3rdparty_2mshadow_2mshadow_2io_8h.html" title="./io.h" alt="" coords="2974,348,3029,375"/>
<area shape="rect" id="node48" href="tensor__container_8h.html" title="tensor container that does memory allocation and resize like STL " alt="" coords="2801,266,2951,293"/>
<area shape="rect" id="node49" href="random_8h.html" title="Random inline functions for tensor. " alt="" coords="2649,184,2741,211"/>
<area shape="rect" id="node50" href="expr__scalar-inl_8h.html" title="definitions of operators in expression with respect to scalar this file will be included several time..." alt="" coords="2966,184,3103,211"/>
<area shape="rect" id="node33" href="broadcast_8h.html" title="support for broadcast and repmat " alt="" coords="995,266,1170,293"/>
<area shape="rect" id="node34" href="unpack__patch2col_8h.html" title="support for unpack " alt="" coords="1194,259,1339,300"/>
<area shape="rect" id="node35" href="pack__col2patch_8h.html" title="support for pack " alt="" coords="1551,266,1761,293"/>
<area shape="rect" id="node36" href="reshape_8h.html" title="support for reshape " alt="" coords="1364,266,1527,293"/>
<area shape="rect" id="node37" href="swapaxis_8h.html" title="support for swapaxis " alt="" coords="1993,266,2164,293"/>
<area shape="rect" id="node38" href="reduceto1d_8h.html" title="support for sum_rows and sumall_except_dim " alt="" coords="1786,266,1969,293"/>
<area shape="rect" id="node39" href="spatial__pool_8h.html" title="support for spatial pooling " alt="" coords="2189,259,2331,300"/>
<area shape="rect" id="node40" href="spatial__unpool_8h.html" title="support for unpool " alt="" coords="2355,259,2498,300"/>
<area shape="rect" id="node41" href="channel__pool_8h.html" title="support for chpool " alt="" coords="325,259,475,300"/>
<area shape="rect" id="node42" href="channel__unpool_8h.html" title="./extension/channel\l_unpool.h" alt="" coords="499,259,648,300"/>
<area shape="rect" id="node43" href="pad_8h.html" title="support for pad " alt="" coords="673,266,807,293"/>
<area shape="rect" id="node44" href="crop_8h.html" title="support for crop " alt="" coords="832,266,971,293"/>
</map>
</div>
</div><div class="textblock"><div class="dynheader">
This graph shows which files directly or indirectly include this file:</div>
<div class="dyncontent">
<div class="center"><img src="stream__gpu-inl_8h__dep__incl.png" border="0" usemap="#_2work_2mxnet_23rdparty_2mshadow_2mshadow_2stream__gpu-inl_8hdep" alt="Graph of files that directly or indirectly include stream_gpu-inl.h"/></div>
<map name="_2work_2mxnet_23rdparty_2mshadow_2mshadow_2stream__gpu-inl_8hdep" id="_2work_2mxnet_23rdparty_2mshadow_2mshadow_2stream__gpu-inl_8hdep">
<area shape="rect" id="node2" href="tensor_8h.html" title="header file of tensor data structure and functions This lib requires explicit memory allocation and d..." alt="" coords="5007,109,5219,151"/>
<area shape="rect" id="node3" href="expr__engine-inl_8h.html" title="definitions of how expressions should be evaluated " alt="" coords="4337,199,4527,255"/>
<area shape="rect" id="node26" href="tensor__cpu-inl_8h.html" title="implementation of CPU host code " alt="" coords="4430,303,4631,359"/>
<area shape="rect" id="node27" href="packet-inl_8h.html" title="Generic packet vectorization code. " alt="" coords="4676,206,4913,247"/>
<area shape="rect" id="node30" href="tensor__gpu-inl_8h.html" title="implementation of GPU host code " alt="" coords="4938,199,5139,255"/>
<area shape="rect" id="node31" href="3rdparty_2mshadow_2mshadow_2io_8h.html" title="/work/mxnet/3rdparty\l/mshadow/mshadow/io.h" alt="" coords="5239,206,5423,247"/>
<area shape="rect" id="node32" href="tensor__container_8h.html" title="tensor container that does memory allocation and resize like STL " alt="" coords="5279,303,5481,359"/>
<area shape="rect" id="node33" href="random_8h.html" title="Random inline functions for tensor. " alt="" coords="5253,414,5475,455"/>
<area shape="rect" id="node34" href="include_2mxnet_2base_8h.html" title="/work/mxnet/include\l/mxnet/base.h" alt="" coords="6091,206,6245,247"/>
<area shape="rect" id="node39" href="include_2mxnet_2op__attr__types_8h.html" title="/work/mxnet/include\l/mxnet/op_attr_types.h" alt="" coords="5785,518,5959,559"/>
<area shape="rect" id="node4" href="extension_8h.html" title="some extension of expressions, used to support something beyond elementwise op " alt="" coords="2643,310,2879,351"/>
<area shape="rect" id="node5" href="implicit__gemm_8h.html" title="support for implicit GEMM operation " alt="" coords="5005,407,5229,463"/>
<area shape="rect" id="node6" href="broadcast_8h.html" title="support for broadcast and repmat " alt="" coords="3765,407,3989,463"/>
<area shape="rect" id="node7" href="unpack__patch2col_8h.html" title="support for unpack " alt="" coords="4013,407,4237,463"/>
<area shape="rect" id="node8" href="pack__col2patch_8h.html" title="support for pack " alt="" coords="4261,407,4485,463"/>
<area shape="rect" id="node9" href="reshape_8h.html" title="support for reshape " alt="" coords="4509,407,4733,463"/>
<area shape="rect" id="node10" href="swapaxis_8h.html" title="support for swapaxis " alt="" coords="4757,407,4981,463"/>
<area shape="rect" id="node11" href="reduceto1d_8h.html" title="support for sum_rows and sumall_except_dim " alt="" coords="5,407,229,463"/>
<area shape="rect" id="node12" href="spatial__pool_8h.html" title="support for spatial pooling " alt="" coords="253,407,477,463"/>
<area shape="rect" id="node13" href="spatial__unpool_8h.html" title="support for unpool " alt="" coords="501,407,725,463"/>
<area shape="rect" id="node14" href="channel__pool_8h.html" title="support for chpool " alt="" coords="749,407,973,463"/>
<area shape="rect" id="node15" href="channel__unpool_8h.html" title="/work/mxnet/3rdparty\l/mshadow/mshadow/extension\l/channel_unpool.h" alt="" coords="997,407,1221,463"/>
<area shape="rect" id="node16" href="pad_8h.html" title="support for pad " alt="" coords="1245,414,1509,455"/>
<area shape="rect" id="node17" href="crop_8h.html" title="support for crop " alt="" coords="1533,407,1757,463"/>
<area shape="rect" id="node18" href="mirror_8h.html" title="support for mirror " alt="" coords="1781,407,2005,463"/>
<area shape="rect" id="node19" href="concat_8h.html" title="support for concatenation " alt="" coords="2029,407,2253,463"/>
<area shape="rect" id="node20" href="choose_8h.html" title="support for implicit array selection operation " alt="" coords="2277,407,2501,463"/>
<area shape="rect" id="node21" href="fill_8h.html" title="support for implicit array filling operation " alt="" coords="2525,407,2749,463"/>
<area shape="rect" id="node22" href="one__hot_8h.html" title="Create one&#45;hot indicator array based on the index. " alt="" coords="2773,407,2997,463"/>
<area shape="rect" id="node23" href="slice_8h.html" title="support for slice a certain dimension. " alt="" coords="3021,407,3245,463"/>
<area shape="rect" id="node24" href="slice__ex_8h.html" title="/work/mxnet/3rdparty\l/mshadow/mshadow/extension\l/slice_ex.h" alt="" coords="3269,407,3493,463"/>
<area shape="rect" id="node25" href="take_8h.html" title="/work/mxnet/3rdparty\l/mshadow/mshadow/extension\l/take.h" alt="" coords="3517,407,3741,463"/>
<area shape="rect" id="node28" href="plain-inl_8h.html" title="support of plain packet that use the plain datatype. " alt="" coords="4707,303,4911,359"/>
<area shape="rect" id="node29" href="sse-inl_8h.html" title="support of sse2 packet optimization of some operations " alt="" coords="4935,303,5139,359"/>
<area shape="rect" id="node35" href="packed__func_8h.html" title="Type&#45;erased function used across MXNET API. " alt="" coords="6674,511,6849,567"/>
<area shape="rect" id="node36" href="engine_8h.html" title="Engine that schedules all the operations according to dependency. " alt="" coords="5673,310,5828,351"/>
<area shape="rect" id="node37" href="include_2mxnet_2ndarray_8h.html" title="/work/mxnet/include\l/mxnet/ndarray.h" alt="" coords="6295,414,6449,455"/>
<area shape="rect" id="node38" href="include_2mxnet_2executor_8h.html" title="/work/mxnet/include\l/mxnet/executor.h" alt="" coords="6095,704,6249,745"/>
<area shape="rect" id="node40" href="include_2mxnet_2operator_8h.html" title="/work/mxnet/include\l/mxnet/operator.h" alt="" coords="6095,615,6249,656"/>
<area shape="rect" id="node41" href="operator__util_8h.html" title="Utility functions and registries to help quickly build new operators. [Deprecated] Use the register f..." alt="" coords="6353,704,6519,745"/>
<area shape="rect" id="node45" href="include_2mxnet_2io_8h.html" title="/work/mxnet/include\l/mxnet/io.h" alt="" coords="6180,518,6335,559"/>
<area shape="rect" id="node46" href="resource_8h.html" title="Global resource allocation handling. " alt="" coords="5876,414,6031,455"/>
<area shape="rect" id="node47" href="storage_8h.html" title="Storage manager across multiple devices. " alt="" coords="6231,310,6385,351"/>
<area shape="rect" id="node48" href="random__generator_8h.html" title="Parallel random number generator. " alt="" coords="5852,310,6055,351"/>
<area shape="rect" id="node49" href="rtc_8h.html" title="/work/mxnet/include\l/mxnet/rtc.h" alt="" coords="6409,310,6564,351"/>
<area shape="rect" id="node50" href="tensor__blob_8h.html" title="TBlob class that holds common representation of arbitrary dimension tensor, can be used to transformed..." alt="" coords="6588,310,6748,351"/>
<area shape="rect" id="node44" href="utils_8h.html" title="Basic utility functions. " alt="" coords="5778,793,5966,835"/>
<area shape="rect" id="node43" href="imperative_8h.html" title="/work/mxnet/include\l/mxnet/imperative.h" alt="" coords="5913,704,6068,745"/>
<area shape="rect" id="node42" href="include_2mxnet_2graph__attr__types_8h.html" title="/work/mxnet/include\l/mxnet/graph_attr_types.h" alt="" coords="5775,615,5969,656"/>
</map>
</div>
</div>
<p><a href="stream__gpu-inl_8h_source.html">Go to the source code of this file.</a></p>
<table class="memberdecls">
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a name="nested-classes"></a>
Classes</h2></td></tr>
<tr class="memitem:"><td class="memItemLeft" align="right" valign="top">struct &#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="structmshadow_1_1Stream_3_01gpu_01_4.html">mshadow::Stream&lt; gpu &gt;</a></td></tr>
<tr class="separator:"><td class="memSeparator" colspan="2">&#160;</td></tr>
</table><table class="memberdecls">
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a name="namespaces"></a>
Namespaces</h2></td></tr>
<tr class="memitem:namespacemshadow"><td class="memItemLeft" align="right" valign="top"> &#160;</td><td class="memItemRight" valign="bottom"><a class="el" href="namespacemshadow.html">mshadow</a></td></tr>
<tr class="memdesc:namespacemshadow"><td class="mdescLeft">&#160;</td><td class="mdescRight">overloaded + operator between half_t and bf16_t <br /></td></tr>
<tr class="separator:"><td class="memSeparator" colspan="2">&#160;</td></tr>
</table><table class="memberdecls">
<tr class="heading"><td colspan="2"><h2 class="groupheader"><a name="func-members"></a>
Functions</h2></td></tr>
<tr class="memitem:a5d8687821fd6ecf8e271b996df51415c"><td class="memTemplParams" colspan="2">template&lt;&gt; </td></tr>
<tr class="memitem:a5d8687821fd6ecf8e271b996df51415c"><td class="memTemplItemLeft" align="right" valign="top">void&#160;</td><td class="memTemplItemRight" valign="bottom"><a class="el" href="namespacemshadow.html#a5d8687821fd6ecf8e271b996df51415c">mshadow::DeleteStream&lt; gpu &gt;</a> (Stream&lt; gpu &gt; *stream)</td></tr>
<tr class="separator:a5d8687821fd6ecf8e271b996df51415c"><td class="memSeparator" colspan="2">&#160;</td></tr>
<tr class="memitem:a89b0009770915378c66bc9647040776d"><td class="memTemplParams" colspan="2">template&lt;&gt; </td></tr>
<tr class="memitem:a89b0009770915378c66bc9647040776d"><td class="memTemplItemLeft" align="right" valign="top">Stream&lt; gpu &gt; *&#160;</td><td class="memTemplItemRight" valign="bottom"><a class="el" href="namespacemshadow.html#a89b0009770915378c66bc9647040776d">mshadow::NewStream&lt; gpu &gt;</a> (bool create_blas_handle, bool create_dnn_handle, int dev_id)</td></tr>
<tr class="separator:a89b0009770915378c66bc9647040776d"><td class="memSeparator" colspan="2">&#160;</td></tr>
</table>
<a name="details" id="details"></a><h2 class="groupheader">Detailed Description</h2>
<div class="textblock"><p>implementation of GPU code </p>
<dl class="section author"><dt>Author</dt><dd>Bing Xu, Tianqi Chen </dd></dl>
</div></div><!-- contents -->
<!-- start footer part -->
<hr class="footer"/><address class="footer"><small>
Generated on Thu Jan 5 2023 00:58:43 for mxnet by &#160;<a href="http://www.doxygen.org/index.html">
<img class="footer" src="doxygen.png" alt="doxygen"/>
</a> 1.8.13
</small></address>
</body>
</html>