|
153 | 153 | <li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.convert_constraint_lambdas"><code class="docutils literal notranslate"><span class="pre">convert_constraint_lambdas()</span></code></a></li> |
154 | 154 | <li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.convert_constraint_restriction"><code class="docutils literal notranslate"><span class="pre">convert_constraint_restriction()</span></code></a></li> |
155 | 155 | <li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.correct_open_cache"><code class="docutils literal notranslate"><span class="pre">correct_open_cache()</span></code></a></li> |
156 | | -<li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.cuda_error_check"><code class="docutils literal notranslate"><span class="pre">cuda_error_check()</span></code></a></li> |
157 | 156 | <li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.delete_temp_file"><code class="docutils literal notranslate"><span class="pre">delete_temp_file()</span></code></a></li> |
158 | 157 | <li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.detect_language"><code class="docutils literal notranslate"><span class="pre">detect_language()</span></code></a></li> |
159 | 158 | <li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.dump_cache"><code class="docutils literal notranslate"><span class="pre">dump_cache()</span></code></a></li> |
|
182 | 181 | <li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.replace_param_occurrences"><code class="docutils literal notranslate"><span class="pre">replace_param_occurrences()</span></code></a></li> |
183 | 182 | <li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.setup_block_and_grid"><code class="docutils literal notranslate"><span class="pre">setup_block_and_grid()</span></code></a></li> |
184 | 183 | <li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.store_cache"><code class="docutils literal notranslate"><span class="pre">store_cache()</span></code></a></li> |
185 | | -<li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.to_valid_nvrtc_gpu_arch_cc"><code class="docutils literal notranslate"><span class="pre">to_valid_nvrtc_gpu_arch_cc()</span></code></a></li> |
186 | 184 | <li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.unparse_constraint_lambda"><code class="docutils literal notranslate"><span class="pre">unparse_constraint_lambda()</span></code></a></li> |
187 | 185 | <li class="toctree-l4"><a class="reference internal" href="#kernel_tuner.util.write_file"><code class="docutils literal notranslate"><span class="pre">write_file()</span></code></a></li> |
188 | 186 | </ul> |
@@ -834,7 +832,7 @@ <h3>kernel_tuner.backends.nvcuda.CudaFunctions<a class="headerlink" href="#kerne |
834 | 832 | <dl class="py class"> |
835 | 833 | <dt class="sig sig-object py" id="kernel_tuner.backends.nvcuda.CudaFunctions"> |
836 | 834 | <em class="property"><span class="pre">class</span><span class="w"> </span></em><span class="sig-prename descclassname"><span class="pre">kernel_tuner.backends.nvcuda.</span></span><span class="sig-name descname"><span class="pre">CudaFunctions</span></span><span class="sig-paren">(</span><em class="sig-param"><span class="n"><span class="pre">device</span></span><span class="o"><span class="pre">=</span></span><span class="default_value"><span class="pre">0</span></span></em>, <em class="sig-param"><span class="n"><span class="pre">iterations</span></span><span class="o"><span class="pre">=</span></span><span class="default_value"><span class="pre">7</span></span></em>, <em class="sig-param"><span class="n"><span class="pre">compiler_options</span></span><span class="o"><span class="pre">=</span></span><span class="default_value"><span class="pre">None</span></span></em>, <em class="sig-param"><span class="n"><span class="pre">observers</span></span><span class="o"><span class="pre">=</span></span><span class="default_value"><span class="pre">None</span></span></em><span class="sig-paren">)</span><a class="headerlink" href="#kernel_tuner.backends.nvcuda.CudaFunctions" title="Link to this definition">¶</a></dt> |
837 | | -<dd><p>Class that groups the Cuda functions on maintains state about the device.</p> |
| 835 | +<dd><p>Class that groups the Cuda functions and maintains state about the device.</p> |
838 | 836 | <dl class="py method"> |
839 | 837 | <dt class="sig sig-object py" id="kernel_tuner.backends.nvcuda.CudaFunctions.__init__"> |
840 | 838 | <span class="sig-name descname"><span class="pre">__init__</span></span><span class="sig-paren">(</span><em class="sig-param"><span class="n"><span class="pre">device</span></span><span class="o"><span class="pre">=</span></span><span class="default_value"><span class="pre">0</span></span></em>, <em class="sig-param"><span class="n"><span class="pre">iterations</span></span><span class="o"><span class="pre">=</span></span><span class="default_value"><span class="pre">7</span></span></em>, <em class="sig-param"><span class="n"><span class="pre">compiler_options</span></span><span class="o"><span class="pre">=</span></span><span class="default_value"><span class="pre">None</span></span></em>, <em class="sig-param"><span class="n"><span class="pre">observers</span></span><span class="o"><span class="pre">=</span></span><span class="default_value"><span class="pre">None</span></span></em><span class="sig-paren">)</span><a class="headerlink" href="#kernel_tuner.backends.nvcuda.CudaFunctions.__init__" title="Link to this definition">¶</a></dt> |
@@ -1690,12 +1688,6 @@ <h2>Util Functions<a class="headerlink" href="#util-functions" title="Link to th |
1690 | 1688 | <dd><p>If cache file was not properly closed, pretend it was properly closed.</p> |
1691 | 1689 | </dd></dl> |
1692 | 1690 |
|
1693 | | -<dl class="py function"> |
1694 | | -<dt class="sig sig-object py" id="kernel_tuner.util.cuda_error_check"> |
1695 | | -<span class="sig-prename descclassname"><span class="pre">kernel_tuner.util.</span></span><span class="sig-name descname"><span class="pre">cuda_error_check</span></span><span class="sig-paren">(</span><em class="sig-param"><span class="n"><span class="pre">error</span></span></em><span class="sig-paren">)</span><a class="headerlink" href="#kernel_tuner.util.cuda_error_check" title="Link to this definition">¶</a></dt> |
1696 | | -<dd><p>Checking the status of CUDA calls using the NVIDIA cuda-python backend.</p> |
1697 | | -</dd></dl> |
1698 | | - |
1699 | 1691 | <dl class="py function"> |
1700 | 1692 | <dt class="sig sig-object py" id="kernel_tuner.util.delete_temp_file"> |
1701 | 1693 | <span class="sig-prename descclassname"><span class="pre">kernel_tuner.util.</span></span><span class="sig-name descname"><span class="pre">delete_temp_file</span></span><span class="sig-paren">(</span><em class="sig-param"><span class="n"><span class="pre">filename</span></span></em><span class="sig-paren">)</span><a class="headerlink" href="#kernel_tuner.util.delete_temp_file" title="Link to this definition">¶</a></dt> |
@@ -1980,12 +1972,6 @@ <h2>Util Functions<a class="headerlink" href="#util-functions" title="Link to th |
1980 | 1972 | <dd><p>Stores a new entry (key, params) to the cachefile.</p> |
1981 | 1973 | </dd></dl> |
1982 | 1974 |
|
1983 | | -<dl class="py function"> |
1984 | | -<dt class="sig sig-object py" id="kernel_tuner.util.to_valid_nvrtc_gpu_arch_cc"> |
1985 | | -<span class="sig-prename descclassname"><span class="pre">kernel_tuner.util.</span></span><span class="sig-name descname"><span class="pre">to_valid_nvrtc_gpu_arch_cc</span></span><span class="sig-paren">(</span><em class="sig-param"><span class="n"><span class="pre">compute_capability</span></span><span class="p"><span class="pre">:</span></span><span class="w"> </span><span class="n"><span class="pre">str</span></span></em><span class="sig-paren">)</span> <span class="sig-return"><span class="sig-return-icon">→</span> <span class="sig-return-typehint"><span class="pre">str</span></span></span><a class="headerlink" href="#kernel_tuner.util.to_valid_nvrtc_gpu_arch_cc" title="Link to this definition">¶</a></dt> |
1986 | | -<dd><p>Returns a valid Compute Capability for NVRTC <cite>--gpu-architecture=</cite>, as per <a class="reference external" href="https://docs.nvidia.com/cuda/nvrtc/index.html#group__options">https://docs.nvidia.com/cuda/nvrtc/index.html#group__options</a>.</p> |
1987 | | -</dd></dl> |
1988 | | - |
1989 | 1975 | <dl class="py function"> |
1990 | 1976 | <dt class="sig sig-object py" id="kernel_tuner.util.unparse_constraint_lambda"> |
1991 | 1977 | <span class="sig-prename descclassname"><span class="pre">kernel_tuner.util.</span></span><span class="sig-name descname"><span class="pre">unparse_constraint_lambda</span></span><span class="sig-paren">(</span><em class="sig-param"><span class="n"><span class="pre">lambda_ast</span></span></em><span class="sig-paren">)</span><a class="headerlink" href="#kernel_tuner.util.unparse_constraint_lambda" title="Link to this definition">¶</a></dt> |
|
0 commit comments