Skip to content

Commit 11bf290

Browse files
sifakis and claude committed
ex_voxelBlockManager_host_cuda: add -fopenmp-simd compile flag
Activates #pragma omp simd hints in decodeInverseMaps and buildMaskPrefixSums without requiring the OpenMP runtime library, yielding ~10-15% faster CPU decode throughput.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
Signed-off-by: Efty Sifakis <esifakis@nvidia.com>
1 parent 8c33baf commit 11bf290

1 file changed

Lines changed: 2 additions & 2 deletions

File tree

nanovdb/nanovdb/examples/CMakeLists.txt

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -117,8 +117,8 @@ nanovdb_example(NAME "ex_coarsen_nanovdb_cuda" OPENVDB)
117 | 117 |   nanovdb_example(NAME "ex_voxelBlockManager_host_cuda")
118 | 118 |   if(TARGET ex_voxelBlockManager_host_cuda)
119 | 119 |   target_compile_options(ex_voxelBlockManager_host_cuda PRIVATE
120 |     | - $<$<COMPILE_LANGUAGE:CUDA>:-Xcompiler=-mavx2>
121 |     | - $<$<COMPILE_LANGUAGE:CXX>:-mavx2>)
    | 120 | + $<$<COMPILE_LANGUAGE:CUDA>:-Xcompiler=-mavx2,-fopenmp-simd>
    | 121 | + $<$<COMPILE_LANGUAGE:CXX>:-mavx2 -fopenmp-simd>)
122 | 122 |   endif()
123 | 123 |
124 | 124 |   if(CUDAToolkit_FOUND)

0 commit comments

Comments
 (0)