diff --git a/clang/tools/dpct/generate_api_migration_status.py b/clang/tools/dpct/generate_api_migration_status.py index 9874e629c0f9..6ffe7bc51733 100644 --- a/clang/tools/dpct/generate_api_migration_status.py +++ b/clang/tools/dpct/generate_api_migration_status.py @@ -173,7 +173,9 @@ def do_update(args): warnings.warn("output path is not exist") return False lib_names = ['Runtime_and_Driver', 'CUB', 'cuBLAS', 'cuDNN', 'cuFFT', 'nvGRAPH', 'ASM', - 'cuRAND', 'cuSOLVER', 'cuSPARSE', 'NCCL', 'nvJPEG', 'NVML', 'thrust', 'wmma', 'nvSHMEM'] + 'cuRAND', 'cuSOLVER', 'cuSPARSE', 'NCCL', 'nvJPEG', 'NVML', 'thrust', 'wmma', + 'nvSHMEM', 'cudnn_frontend'] + # lib file name = APINames_$(libname).inc for lib_name in lib_names: if lib_name == 'Runtime_and_Driver': diff --git a/docs/dev_guide/api-mapping-status/ASM_API_migration_status.csv b/docs/dev_guide/api-mapping-status/ASM_API_migration_status.csv index 9ab7cee56299..69c3064cde75 100644 --- a/docs/dev_guide/api-mapping-status/ASM_API_migration_status.csv +++ b/docs/dev_guide/api-mapping-status/ASM_API_migration_status.csv @@ -41,7 +41,7 @@ griddepcontrol,NO, isspacep,NO, istypep,NO, ld,YES, Partial -ldmatrix,YES,Partial +ldmatrix,YES, Partial ldu,NO, lg2,YES, lop3,YES, @@ -89,7 +89,7 @@ sqrt,YES, st,YES, Partial stackrestore,NO, stacksave,NO, -stmatrix,YES,Partial +stmatrix,YES, Partial sub,YES, Partial subc,NO, suld,NO, diff --git a/docs/dev_guide/api-mapping-status/Runtime_and_Driver_API_migration_status.csv b/docs/dev_guide/api-mapping-status/Runtime_and_Driver_API_migration_status.csv index fe1b717b43a6..950a821d7837 100644 --- a/docs/dev_guide/api-mapping-status/Runtime_and_Driver_API_migration_status.csv +++ b/docs/dev_guide/api-mapping-status/Runtime_and_Driver_API_migration_status.csv @@ -76,7 +76,7 @@ cudaEventDestroy,YES,:ref:`DPCT1026` / :ref:`DPCT1027` cudaEventElapsedTime,YES,:ref:`DPCT1012` cudaEventQuery,YES, cudaEventRecord,YES,:ref:`DPCT1012` / :ref:`DPCT1024` -cudaEventRecordWithFlags,NO, +cudaEventRecordWithFlags,YES,:ref:`DPCT1028` cudaEventSynchronize,YES,:ref:`DPCT1012` cudaDestroyExternalMemory,YES, cudaDestroyExternalSemaphore,YES, @@ -909,10 +909,10 @@ __fdiv_rn,YES,:ref:`DPCT1013` __fdiv_ru,YES,:ref:`DPCT1013` __fdiv_rz,YES,:ref:`DPCT1013` __fdividef,YES, -__fmaf_ieee_rd,NO, -__fmaf_ieee_rn,NO, -__fmaf_ieee_ru,NO, -__fmaf_ieee_rz,NO, +__fmaf_ieee_rd,YES,:ref:`DPCT1013` +__fmaf_ieee_rn,YES,:ref:`DPCT1013` +__fmaf_ieee_ru,YES,:ref:`DPCT1013` +__fmaf_ieee_rz,YES,:ref:`DPCT1013` __fmaf_rd,YES,:ref:`DPCT1013` __fmaf_rn,YES,:ref:`DPCT1013` __fmaf_ru,YES,:ref:`DPCT1013` diff --git a/docs/dev_guide/api-mapping-status/cudnn_frontend_API_migration_status.csv b/docs/dev_guide/api-mapping-status/cudnn_frontend_API_migration_status.csv new file mode 100644 index 000000000000..83b4d04562bd --- /dev/null +++ b/docs/dev_guide/api-mapping-status/cudnn_frontend_API_migration_status.csv @@ -0,0 +1,722 @@ +Function,Migration Support,Diagnostic Message +cudnn_frontend::AllowAll,NO, +cudnn_frontend::allowAllConfig,NO, +cudnn_frontend::check_errata,NO, +cudnn_frontend::check_rule,NO, +cudnn_frontend::check_shape,NO, +cudnn_frontend::cudnnReorderFilterAndBiasInt8x32,NO, +cudnn_frontend::filter,NO, +cudnn_frontend::from_json,NO, +cudnn_frontend::getLogger,NO, +cudnn_frontend::getStream,NO, +cudnn_frontend::get_environment,NO, +cudnn_frontend::get_fallback_engine_list,NO, +cudnn_frontend::get_heuristics_list,NO, +cudnn_frontend::get_heuristics_list_impl,NO, +cudnn_frontend::get_pointwise_mode_port_count,NO, +cudnn_frontend::graph::from_json,NO, +cudnn_frontend::graph::to_json,NO, +cudnn_frontend::hasBehaviorNote,NO, +cudnn_frontend::hasNumericalNote,NO, +cudnn_frontend::isLoggingEnabled,NO, +cudnn_frontend::load_from_config,NO, +cudnn_frontend::set_error_and_throw_exception,NO, +cudnn_frontend::to_json,NO, +cudnn_frontend::to_string,NO, +cudnn_frontend::ConvDescBuilder::build,NO, +cudnn_frontend::ConvDescBuilder::setComputePrecision,NO, +cudnn_frontend::ConvDescBuilder::setComputeType,NO, +cudnn_frontend::ConvDescBuilder::setDataType,NO, +cudnn_frontend::ConvDescBuilder::setDilation,NO, +cudnn_frontend::ConvDescBuilder::setMathMode,NO, +cudnn_frontend::ConvDescBuilder::setNDims,NO, +cudnn_frontend::ConvDescBuilder::setPostPadding,NO, +cudnn_frontend::ConvDescBuilder::setPrePadding,NO, +cudnn_frontend::ConvDescBuilder::setSpatialDimCount,NO, +cudnn_frontend::ConvDescBuilder::setSpatialStride,NO, +cudnn_frontend::ConvDescBuilder::setStrides,NO, +cudnn_frontend::ConvDesc::describe,NO, +cudnn_frontend::ConvDesc::getComputePrecision,NO, +cudnn_frontend::ConvDesc::getComputeType,NO, +cudnn_frontend::ConvDesc::getDilation,NO, +cudnn_frontend::ConvDesc::getDimensionCount,NO, +cudnn_frontend::ConvDesc::getMathMode,NO, +cudnn_frontend::ConvDesc::getPadding,NO, +cudnn_frontend::ConvDesc::getSpatialDimCount,NO, +cudnn_frontend::ConvDesc::getSpatialStride,NO, +cudnn_frontend::ConvDesc::getStride,NO, +cudnn_frontend::EngineBuilder::build,NO, +cudnn_frontend::EngineBuilder::setGlobalEngineIdx,NO, +cudnn_frontend::EngineBuilder::setOperationGraph,NO, +cudnn_frontend::EngineConfigBuilder::build,NO, +cudnn_frontend::EngineConfigBuilder::setEngine,NO, +cudnn_frontend::EngineConfig::describe,NO, +cudnn_frontend::EngineConfig::getTag,NO, +cudnn_frontend::EngineFallbackListBuilder::build,NO, +cudnn_frontend::EngineFallbackListBuilder::setOperation,NO, +cudnn_frontend::EngineFallbackListBuilder::setOperationGraph,NO, +cudnn_frontend::EngineFallbackList::describe,NO, +cudnn_frontend::EngineFallbackList::getFallbackList,NO, +cudnn_frontend::EngineHeuristicsBuilder::build,NO, +cudnn_frontend::EngineHeuristicsBuilder::setHeurMode,NO, +cudnn_frontend::EngineHeuristicsBuilder::setOperationGraph,NO, +cudnn_frontend::EngineHeuristicsBuilder::setSMCount,NO, +cudnn_frontend::EngineHeuristics::describe,NO, +cudnn_frontend::EngineHeuristics::getEngineConfig,NO, +cudnn_frontend::EngineHeuristics::getEngineConfigCount,NO, +cudnn_frontend::EngineHeuristics::get_heur_b_mutex,NO, +cudnn_frontend::Engine::buildKnobs,NO, +cudnn_frontend::Engine::describe,NO, +cudnn_frontend::Engine::getFinalizedKnobs,NO, +cudnn_frontend::Engine::getSupportedKnobs,NO, +cudnn_frontend::Engine::getTag,NO, +cudnn_frontend::Engine::knobs_set,NO, +cudnn_frontend::Engine::Knob::describe,NO, +cudnn_frontend::Engine::Knob::getChoice,NO, +cudnn_frontend::Engine::Knob::getKnobType,NO, +cudnn_frontend::Engine::Knob::getMaxValue,NO, +cudnn_frontend::Engine::Knob::getMinValue,NO, +cudnn_frontend::Engine::Knob::getStride,NO, +cudnn_frontend::Engine::Knob::setChoice,NO, +cudnn_frontend::ExecutionPlanBuilder::build,NO, +cudnn_frontend::ExecutionPlanBuilder::loadFromJson,NO, +cudnn_frontend::ExecutionPlanBuilder::setEngineConfig,NO, +cudnn_frontend::ExecutionPlanBuilder::setHandle,NO, +cudnn_frontend::ExecutionPlanCache::add_plan_to_cache,NO, +cudnn_frontend::ExecutionPlanCache::get_name,NO, +cudnn_frontend::ExecutionPlanCache::get_plan_from_cache,NO, +cudnn_frontend::ExecutionPlanCache::is_fastest_plan_stable,NO, +cudnn_frontend::ExecutionPlanCache::is_fastest_plan_stable,NO, +cudnn_frontend::ExecutionPlanCache::set_saturation_count,NO, +cudnn_frontend::ExecutionPlan::buildTag,NO, +cudnn_frontend::ExecutionPlan::computeWorkSpaceSize,NO, +cudnn_frontend::ExecutionPlan::describe,NO, +cudnn_frontend::ExecutionPlan::fetchNotes,NO, +cudnn_frontend::ExecutionPlan::getAllBehaviorNotes,NO, +cudnn_frontend::ExecutionPlan::getAllNumericNotes,NO, +cudnn_frontend::ExecutionPlan::getBehaviorNotes,NO, +cudnn_frontend::ExecutionPlan::getExecutionTime,NO, +cudnn_frontend::ExecutionPlan::getJsonRepresentation,NO, +cudnn_frontend::ExecutionPlan::getNumericNotes,NO, +cudnn_frontend::ExecutionPlan::getTag,NO, +cudnn_frontend::ExecutionPlan::getWorkspaceSize,NO, +cudnn_frontend::ExecutionPlan::setExecutionTime,NO, +cudnn_frontend::ICudnn::create_cudnn_operation_graph,NO, +cudnn_frontend::ICudnn::create_cudnn_tensor,NO, +cudnn_frontend::ICudnn::execute_cudnn_plan_with_uid,NO, +cudnn_frontend::ICudnn::get_cudnn_workspace_size_node,NO, +cudnn_frontend::ICudnn::get_max_cudnn_workspace_size_node,NO, +cudnn_frontend::MatMulDescBuilder::build,NO, +cudnn_frontend::MatMulDescBuilder::setComputeType,NO, +cudnn_frontend::MatMulDescBuilder::setMathPrecision,NO, +cudnn_frontend::MatMulDescBuilder::setPaddingValue,NO, +cudnn_frontend::MatMulDesc::describe,NO, +cudnn_frontend::OperationBuilder::addPeerStatTensor,NO, +cudnn_frontend::OperationBuilder::build,NO, +cudnn_frontend::OperationBuilder::build_bn_bwd_weight_op,NO, +cudnn_frontend::OperationBuilder::build_bn_finalize_op,NO, +cudnn_frontend::OperationBuilder::build_conv_backward_data,NO, +cudnn_frontend::OperationBuilder::build_conv_backward_filter,NO, +cudnn_frontend::OperationBuilder::build_conv_forward,NO, +cudnn_frontend::OperationBuilder::build_genstats_op,NO, +cudnn_frontend::OperationBuilder::build_matmul_op,NO, +cudnn_frontend::OperationBuilder::build_norm_backward,NO, +cudnn_frontend::OperationBuilder::build_norm_forward,NO, +cudnn_frontend::OperationBuilder::build_pointwise_op,NO, +cudnn_frontend::OperationBuilder::build_reduction_op,NO, +cudnn_frontend::OperationBuilder::build_resample_bwd_operation,NO, +cudnn_frontend::OperationBuilder::build_resample_fwd_operation,NO, +cudnn_frontend::OperationBuilder::build_reshape_operation,NO, +cudnn_frontend::OperationBuilder::build_rng_operation,NO, +cudnn_frontend::OperationBuilder::copy_dims_and_strides,NO, +cudnn_frontend::OperationBuilder::extract_feature_vector,NO, +cudnn_frontend::OperationBuilder::setAccumCountTensor,NO, +cudnn_frontend::OperationBuilder::setAlpha,NO, +cudnn_frontend::OperationBuilder::setAlpha2,NO, +cudnn_frontend::OperationBuilder::setBNFinalizeMode,NO, +cudnn_frontend::OperationBuilder::setBeta,NO, +cudnn_frontend::OperationBuilder::setBias,NO, +cudnn_frontend::OperationBuilder::setComputeType,NO, +cudnn_frontend::OperationBuilder::setDBias,NO, +cudnn_frontend::OperationBuilder::setDScale,NO, +cudnn_frontend::OperationBuilder::setDScaleAndDBias,NO, +cudnn_frontend::OperationBuilder::setEpsilonTensor,NO, +cudnn_frontend::OperationBuilder::setEqScaleAndBias,NO, +cudnn_frontend::OperationBuilder::setEqScalesAndBias,NO, +cudnn_frontend::OperationBuilder::setExpDecayFactorTensor,NO, +cudnn_frontend::OperationBuilder::setGenStatsMode,NO, +cudnn_frontend::OperationBuilder::setMathPrecision,NO, +cudnn_frontend::OperationBuilder::setNextRunningMeanAndVar,NO, +cudnn_frontend::OperationBuilder::setNormFwdPhase,NO, +cudnn_frontend::OperationBuilder::setNormalizationMode,NO, +cudnn_frontend::OperationBuilder::setOffsetDesc,NO, +cudnn_frontend::OperationBuilder::setPeerStatTensor,NO, +cudnn_frontend::OperationBuilder::setPrevRunningMeanAndVar,NO, +cudnn_frontend::OperationBuilder::setResampleDesc,NO, +cudnn_frontend::OperationBuilder::setRngDesc,NO, +cudnn_frontend::OperationBuilder::setSavedInvVar,NO, +cudnn_frontend::OperationBuilder::setSavedMeanAndInvVar,NO, +cudnn_frontend::OperationBuilder::setScale,NO, +cudnn_frontend::OperationBuilder::setScaleAndBias,NO, +cudnn_frontend::OperationBuilder::setSeed,NO, +cudnn_frontend::OperationBuilder::setSeedDesc,NO, +cudnn_frontend::OperationBuilder::setSqSumDesc,NO, +cudnn_frontend::OperationBuilder::setSumDesc,NO, +cudnn_frontend::OperationBuilder::setaMatDesc,NO, +cudnn_frontend::OperationBuilder::setbDesc,NO, +cudnn_frontend::OperationBuilder::setbMatDesc,NO, +cudnn_frontend::OperationBuilder::setcDesc,NO, +cudnn_frontend::OperationBuilder::setcMatDesc,NO, +cudnn_frontend::OperationBuilder::setdwDesc,NO, +cudnn_frontend::OperationBuilder::setdxDesc,NO, +cudnn_frontend::OperationBuilder::setdyDesc,NO, +cudnn_frontend::OperationBuilder::setidxDesc,NO, +cudnn_frontend::OperationBuilder::setkOverrideDesc,NO, +cudnn_frontend::OperationBuilder::setmOverrideDesc,NO, +cudnn_frontend::OperationBuilder::setmatmulDesc,NO, +cudnn_frontend::OperationBuilder::setnOverrideDesc,NO, +cudnn_frontend::OperationBuilder::setpwDesc,NO, +cudnn_frontend::OperationBuilder::setreductionDesc,NO, +cudnn_frontend::OperationBuilder::settDesc,NO, +cudnn_frontend::OperationBuilder::setwDesc,NO, +cudnn_frontend::OperationBuilder::setxDesc,NO, +cudnn_frontend::OperationBuilder::setyDesc,NO, +cudnn_frontend::OperationBuilder::validate_bn_bwd_weight_op,NO, +cudnn_frontend::OperationBuilder::validate_convolution_op,NO, +cudnn_frontend::OperationBuilder::validate_matmul_op,NO, +cudnn_frontend::OperationBuilder::validate_norm_op,NO, +cudnn_frontend::OperationBuilder::validate_pointwise_op,NO, +cudnn_frontend::OperationBuilder::validate_reduction_op,NO, +cudnn_frontend::OperationBuilder::validate_resample_op,NO, +cudnn_frontend::OperationBuilder::validate_reshape_op,NO, +cudnn_frontend::OperationBuilder::validate_rng_op,NO, +cudnn_frontend::OperationGraphBuilder::build,NO, +cudnn_frontend::OperationGraphBuilder::setHandle,NO, +cudnn_frontend::OperationGraphBuilder::setOperationGraph,NO, +cudnn_frontend::OperationGraph::describe,NO, +cudnn_frontend::OperationGraph::getEngineCount,NO, +cudnn_frontend::OperationGraph::getFeatureVector,NO, +cudnn_frontend::OperationGraph::getOpCount,NO, +cudnn_frontend::OperationGraph::getOps,NO, +cudnn_frontend::OperationGraph::getTag,NO, +cudnn_frontend::OperationGraph::setFeatureVector,NO, +cudnn_frontend::Operation::describe,NO, +cudnn_frontend::Operation::getFeatureVector,NO, +cudnn_frontend::Operation::getOutputTensor,NO, +cudnn_frontend::Operation::getTag,NO, +cudnn_frontend::PointWiseDescBuilder::build,NO, +cudnn_frontend::PointWiseDescBuilder::setAxis,NO, +cudnn_frontend::PointWiseDescBuilder::setClipping,NO, +cudnn_frontend::PointWiseDescBuilder::setComputeType,NO, +cudnn_frontend::PointWiseDescBuilder::setEluAlpha,NO, +cudnn_frontend::PointWiseDescBuilder::setMathPrecision,NO, +cudnn_frontend::PointWiseDescBuilder::setMode,NO, +cudnn_frontend::PointWiseDescBuilder::setReluLowerClip,NO, +cudnn_frontend::PointWiseDescBuilder::setReluLowerClipSlope,NO, +cudnn_frontend::PointWiseDescBuilder::setReluUpperClip,NO, +cudnn_frontend::PointWiseDescBuilder::setSoftplusBeta,NO, +cudnn_frontend::PointWiseDescBuilder::setSwishBeta,NO, +cudnn_frontend::PointWiseDesc::describe,NO, +cudnn_frontend::PointWiseDesc::getPointWiseMode,NO, +cudnn_frontend::PointWiseDesc::getPortCount,NO, +cudnn_frontend::ReductionDescBuilder::build,NO, +cudnn_frontend::ReductionDescBuilder::setComputeType,NO, +cudnn_frontend::ReductionDescBuilder::setMathPrecision,NO, +cudnn_frontend::ReductionDescBuilder::setReductionOp,NO, +cudnn_frontend::ReductionDesc::describe,NO, +cudnn_frontend::ResampleDescBuilder::build,NO, +cudnn_frontend::ResampleDescBuilder::setComputeType,NO, +cudnn_frontend::ResampleDescBuilder::setNanPropagation,NO, +cudnn_frontend::ResampleDescBuilder::setPaddingMode,NO, +cudnn_frontend::ResampleDescBuilder::setPostPadding,NO, +cudnn_frontend::ResampleDescBuilder::setPrePadding,NO, +cudnn_frontend::ResampleDescBuilder::setResampleMode,NO, +cudnn_frontend::ResampleDescBuilder::setSpatialDim,NO, +cudnn_frontend::ResampleDescBuilder::setSpatialStride,NO, +cudnn_frontend::ResampleDesc::describe,NO, +cudnn_frontend::ResampleDesc::getComputeType,NO, +cudnn_frontend::ResampleDesc::getMode,NO, +cudnn_frontend::ResampleDesc::getNanOpt,NO, +cudnn_frontend::ResampleDesc::getPaddingMode,NO, +cudnn_frontend::ResampleDesc::getPostPadding,NO, +cudnn_frontend::ResampleDesc::getPrePadding,NO, +cudnn_frontend::ResampleDesc::getSpatialDimCount,NO, +cudnn_frontend::ResampleDesc::getSpatialStride,NO, +cudnn_frontend::ResampleDesc::getWindowDim,NO, +cudnn_frontend::RngDescBuilder::build,NO, +cudnn_frontend::RngDescBuilder::setBernoulliDistProbability,NO, +cudnn_frontend::RngDescBuilder::setNormalDistMean,NO, +cudnn_frontend::RngDescBuilder::setNormalDistParams,NO, +cudnn_frontend::RngDescBuilder::setNormalDistStdDev,NO, +cudnn_frontend::RngDescBuilder::setRngDistribution,NO, +cudnn_frontend::RngDescBuilder::setUniformDistMax,NO, +cudnn_frontend::RngDescBuilder::setUniformDistMin,NO, +cudnn_frontend::RngDescBuilder::setUniformDistParams,NO, +cudnn_frontend::RngDesc::describe,NO, +cudnn_frontend::RngDesc::getBernoulliDistProbability,NO, +cudnn_frontend::RngDesc::getDistribution,NO, +cudnn_frontend::RngDesc::getNormalDistMean,NO, +cudnn_frontend::RngDesc::getNormalDistStdDev,NO, +cudnn_frontend::RngDesc::getUniformDistMax,NO, +cudnn_frontend::RngDesc::getUniformDistMin,NO, +cudnn_frontend::TensorBuilder::build,NO, +cudnn_frontend::TensorBuilder::cloneFrom,NO, +cudnn_frontend::TensorBuilder::setAlignment,NO, +cudnn_frontend::TensorBuilder::setByValue,NO, +cudnn_frontend::TensorBuilder::setDataType,NO, +cudnn_frontend::TensorBuilder::setDim,NO, +cudnn_frontend::TensorBuilder::setId,NO, +cudnn_frontend::TensorBuilder::setRaggedOffset,NO, +cudnn_frontend::TensorBuilder::setReorderType,NO, +cudnn_frontend::TensorBuilder::setStride,NO, +cudnn_frontend::TensorBuilder::setStrides,NO, +cudnn_frontend::TensorBuilder::setVectorCountAndDimension,NO, +cudnn_frontend::TensorBuilder::setVirtual,NO, +cudnn_frontend::Tensor::describe,NO, +cudnn_frontend::Tensor::getAlignment,NO, +cudnn_frontend::Tensor::getDataType,NO, +cudnn_frontend::Tensor::getDim,NO, +cudnn_frontend::Tensor::getDimArray,NO, +cudnn_frontend::Tensor::getDimCount,NO, +cudnn_frontend::Tensor::getDimensionCount,NO, +cudnn_frontend::Tensor::getId,NO, +cudnn_frontend::Tensor::getPackedElementCount,NO, +cudnn_frontend::Tensor::getStride,NO, +cudnn_frontend::Tensor::getStrideArray,NO, +cudnn_frontend::Tensor::isVirtualTensor,NO, +cudnn_frontend::VariantPackBuilder::build,NO, +cudnn_frontend::VariantPackBuilder::setDataPointers,NO, +cudnn_frontend::VariantPackBuilder::setUids,NO, +cudnn_frontend::VariantPackBuilder::setWorkspacePointer,NO, +cudnn_frontend::VariantPack::describe,NO, +cudnn_frontend::cudnnException::getCudnnStatus,NO, +cudnn_frontend::cudnnException::what,NO, +cudnn_frontend::cudnnGraphNotSupportedException::what,NO, +cudnn_frontend::error_object::get_code,NO, +cudnn_frontend::error_object::get_message,NO, +cudnn_frontend::error_object::is_bad,NO, +cudnn_frontend::error_object::is_good,NO, +cudnn_frontend::graph::Attributes::fill_from_context,NO, +cudnn_frontend::graph::Attributes::fill_pass_by_value,NO, +cudnn_frontend::graph::Attributes::get_non_virtual_uids,NO, +cudnn_frontend::graph::Attributes::get_prefilled_uids,NO, +cudnn_frontend::graph::Attributes::self,NO, +cudnn_frontend::graph::Attributes::set_compute_data_type,NO, +cudnn_frontend::graph::Attributes::set_name,NO, +cudnn_frontend::graph::Attributes::set_uids,NO, +cudnn_frontend::graph::Attributes::validate_inputs,NO, +cudnn_frontend::graph::Attributes::validate_outputs,NO, +cudnn_frontend::graph::BN_finalize_attributes::set_previous_running_stats,NO, +cudnn_frontend::graph::BatchNormFinalizeNode::create_cudnn_operations,NO, +cudnn_frontend::graph::BatchNormFinalizeNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::BatchNormFinalizeNode::getType,NO, +cudnn_frontend::graph::BatchNormFinalizeNode::post_validate_node,NO, +cudnn_frontend::graph::BatchNormFinalizeNode::pre_validate_node,NO, +cudnn_frontend::graph::BatchNormFinalizeNode::serialize,NO, +cudnn_frontend::graph::BatchNormNode::create_cudnn_operations,NO, +cudnn_frontend::graph::BatchNormNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::BatchNormNode::getType,NO, +cudnn_frontend::graph::BatchNormNode::post_validate_node,NO, +cudnn_frontend::graph::BatchNormNode::pre_validate_node,NO, +cudnn_frontend::graph::BatchNormNode::serialize,NO, +cudnn_frontend::graph::BatchnormInferenceNode::create_cudnn_operations,NO, +cudnn_frontend::graph::BatchnormInferenceNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::BatchnormInferenceNode::getType,NO, +cudnn_frontend::graph::BatchnormInferenceNode::post_validate_node,NO, +cudnn_frontend::graph::BatchnormInferenceNode::pre_validate_node,NO, +cudnn_frontend::graph::BatchnormInferenceNode::serialize,NO, +cudnn_frontend::graph::Batchnorm_attributes::set_epsilon,NO, +cudnn_frontend::graph::Batchnorm_attributes::set_peer_stats,NO, +cudnn_frontend::graph::Batchnorm_attributes::set_previous_running_stats,NO, +cudnn_frontend::graph::Batchnorm_backward_attributes::set_peer_stats,NO, +cudnn_frontend::graph::Batchnorm_backward_attributes::set_saved_mean_and_inv_variance,NO, +cudnn_frontend::graph::Conv_dgrad_attributes::get_dilation,NO, +cudnn_frontend::graph::Conv_dgrad_attributes::get_post_padding,NO, +cudnn_frontend::graph::Conv_dgrad_attributes::get_pre_padding,NO, +cudnn_frontend::graph::Conv_dgrad_attributes::get_stride,NO, +cudnn_frontend::graph::Conv_dgrad_attributes::set_dilation,NO, +cudnn_frontend::graph::Conv_dgrad_attributes::set_padding,NO, +cudnn_frontend::graph::Conv_dgrad_attributes::set_post_padding,NO, +cudnn_frontend::graph::Conv_dgrad_attributes::set_pre_padding,NO, +cudnn_frontend::graph::Conv_dgrad_attributes::set_stride,NO, +cudnn_frontend::graph::Conv_fprop_attributes::get_dilation,NO, +cudnn_frontend::graph::Conv_fprop_attributes::get_post_padding,NO, +cudnn_frontend::graph::Conv_fprop_attributes::get_pre_padding,NO, +cudnn_frontend::graph::Conv_fprop_attributes::get_stride,NO, +cudnn_frontend::graph::Conv_fprop_attributes::set_dilation,NO, +cudnn_frontend::graph::Conv_fprop_attributes::set_padding,NO, +cudnn_frontend::graph::Conv_fprop_attributes::set_post_padding,NO, +cudnn_frontend::graph::Conv_fprop_attributes::set_pre_padding,NO, +cudnn_frontend::graph::Conv_fprop_attributes::set_stride,NO, +cudnn_frontend::graph::Conv_wgrad_attributes::get_dilation,NO, +cudnn_frontend::graph::Conv_wgrad_attributes::get_post_padding,NO, +cudnn_frontend::graph::Conv_wgrad_attributes::get_pre_padding,NO, +cudnn_frontend::graph::Conv_wgrad_attributes::get_stride,NO, +cudnn_frontend::graph::Conv_wgrad_attributes::set_dilation,NO, +cudnn_frontend::graph::Conv_wgrad_attributes::set_padding,NO, +cudnn_frontend::graph::Conv_wgrad_attributes::set_post_padding,NO, +cudnn_frontend::graph::Conv_wgrad_attributes::set_pre_padding,NO, +cudnn_frontend::graph::Conv_wgrad_attributes::set_stride,NO, +cudnn_frontend::graph::ConvolutionNode::create_cudnn_operations,NO, +cudnn_frontend::graph::ConvolutionNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::ConvolutionNode::getType,NO, +cudnn_frontend::graph::ConvolutionNode::post_validate_node,NO, +cudnn_frontend::graph::ConvolutionNode::pre_validate_node,NO, +cudnn_frontend::graph::ConvolutionNode::serialize,NO, +cudnn_frontend::graph::DBNNode::create_cudnn_operations,NO, +cudnn_frontend::graph::DBNNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::DBNNode::getType,NO, +cudnn_frontend::graph::DBNNode::post_validate_node,NO, +cudnn_frontend::graph::DBNNode::pre_validate_node,NO, +cudnn_frontend::graph::DBNNode::serialize,NO, +cudnn_frontend::graph::DBNWeightNode::create_cudnn_operations,NO, +cudnn_frontend::graph::DBNWeightNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::DBNWeightNode::getType,NO, +cudnn_frontend::graph::DBNWeightNode::post_validate_node,NO, +cudnn_frontend::graph::DBNWeightNode::pre_validate_node,NO, +cudnn_frontend::graph::DBNWeightNode::serialize,NO, +cudnn_frontend::graph::DINNode::create_cudnn_operations,NO, +cudnn_frontend::graph::DINNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::DINNode::getType,NO, +cudnn_frontend::graph::DINNode::post_validate_node,NO, +cudnn_frontend::graph::DINNode::pre_validate_node,NO, +cudnn_frontend::graph::DINNode::serialize,NO, +cudnn_frontend::graph::DLNNode::create_cudnn_operations,NO, +cudnn_frontend::graph::DLNNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::DLNNode::getType,NO, +cudnn_frontend::graph::DLNNode::post_validate_node,NO, +cudnn_frontend::graph::DLNNode::pre_validate_node,NO, +cudnn_frontend::graph::DLNNode::serialize,NO, +cudnn_frontend::graph::DRMSNormNode::create_cudnn_operations,NO, +cudnn_frontend::graph::DRMSNormNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::DRMSNormNode::getType,NO, +cudnn_frontend::graph::DRMSNormNode::post_validate_node,NO, +cudnn_frontend::graph::DRMSNormNode::pre_validate_node,NO, +cudnn_frontend::graph::DRMSNormNode::serialize,NO, +cudnn_frontend::graph::DgradNode::create_cudnn_operations,NO, +cudnn_frontend::graph::DgradNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::DgradNode::getType,NO, +cudnn_frontend::graph::DgradNode::post_validate_node,NO, +cudnn_frontend::graph::DgradNode::pre_validate_node,NO, +cudnn_frontend::graph::DgradNode::serialize,NO, +cudnn_frontend::graph::Execution_plan_list::_build_plan_at_index_impl,NO, +cudnn_frontend::graph::Execution_plan_list::autotune,NO, +cudnn_frontend::graph::Execution_plan_list::autotune_default_impl,NO, +cudnn_frontend::graph::Execution_plan_list::build_plan_at_index,NO, +cudnn_frontend::graph::Execution_plan_list::build_plans,NO, +cudnn_frontend::graph::Execution_plan_list::check_support,NO, +cudnn_frontend::graph::Execution_plan_list::check_support_at_index,NO, +cudnn_frontend::graph::Execution_plan_list::filter_behavior_notes,NO, +cudnn_frontend::graph::Execution_plan_list::filter_numeric_notes,NO, +cudnn_frontend::graph::Execution_plan_list::get_autotune_workspace,NO, +cudnn_frontend::graph::Execution_plan_list::get_barred_engine_configs,NO, +cudnn_frontend::graph::Execution_plan_list::get_execution_plans,NO, +cudnn_frontend::graph::Execution_plan_list::is_plan_index_executable,NO, +cudnn_frontend::graph::Execution_plan_list::query_properties,NO, +cudnn_frontend::graph::Execution_plan_list::set_barred_names,NO, +cudnn_frontend::graph::Execution_plan_list::set_engine_configs,NO, +cudnn_frontend::graph::Execution_plan_list::set_max_shared_mem_allowed,NO, +cudnn_frontend::graph::Execution_plan_list::set_max_workspace_allowed,NO, +cudnn_frontend::graph::Execution_plan_list::set_tag,NO, +cudnn_frontend::graph::GenstatsNode::create_cudnn_operations,NO, +cudnn_frontend::graph::GenstatsNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::GenstatsNode::getType,NO, +cudnn_frontend::graph::GenstatsNode::post_validate_node,NO, +cudnn_frontend::graph::GenstatsNode::pre_validate_node,NO, +cudnn_frontend::graph::GenstatsNode::serialize,NO, +cudnn_frontend::graph::Graph::add_to_tensor_map,NO, +cudnn_frontend::graph::Graph::batchnorm,NO, +cudnn_frontend::graph::Graph::batchnorm_backward,NO, +cudnn_frontend::graph::Graph::batchnorm_inference,NO, +cudnn_frontend::graph::Graph::bn_finalize,NO, +cudnn_frontend::graph::Graph::build,NO, +cudnn_frontend::graph::Graph::build_plan_at_index,NO, +cudnn_frontend::graph::Graph::build_plans,NO, +cudnn_frontend::graph::Graph::check_support,NO, +cudnn_frontend::graph::Graph::collect_pre_assigned_uids_,NO, +cudnn_frontend::graph::Graph::conv_dgrad,NO, +cudnn_frontend::graph::Graph::conv_fprop,NO, +cudnn_frontend::graph::Graph::conv_wgrad,NO, +cudnn_frontend::graph::Graph::create_cudnn_tensors_,NO, +cudnn_frontend::graph::Graph::create_execution_plans,NO, +cudnn_frontend::graph::Graph::dbn_weight,NO, +cudnn_frontend::graph::Graph::deselect_behavior_notes,NO, +cudnn_frontend::graph::Graph::deselect_engines,NO, +cudnn_frontend::graph::Graph::deselect_numeric_notes,NO, +cudnn_frontend::graph::Graph::deselect_shared_mem_greater_than,NO, +cudnn_frontend::graph::Graph::deselect_workspace_greater_than,NO, +cudnn_frontend::graph::Graph::deserialize,NO, +cudnn_frontend::graph::Graph::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::Graph::genstats,NO, +cudnn_frontend::graph::Graph::getType,NO, +cudnn_frontend::graph::Graph::get_execution_plan_count,NO, +cudnn_frontend::graph::Graph::instancenorm,NO, +cudnn_frontend::graph::Graph::instancenorm_backward,NO, +cudnn_frontend::graph::Graph::layernorm,NO, +cudnn_frontend::graph::Graph::layernorm_backward,NO, +cudnn_frontend::graph::Graph::output_tensor,NO, +cudnn_frontend::graph::Graph::pass_by_value_tensors_,NO, +cudnn_frontend::graph::Graph::post_validate_node,NO, +cudnn_frontend::graph::Graph::pre_validate_node,NO, +cudnn_frontend::graph::Graph::print,NO, +cudnn_frontend::graph::Graph::rmsnorm,NO, +cudnn_frontend::graph::Graph::rmsnorm_backward,NO, +cudnn_frontend::graph::Graph::scaled_dot_product_flash_attention,NO, +cudnn_frontend::graph::Graph::scaled_dot_product_flash_attention_backward,NO, +cudnn_frontend::graph::Graph::sdpa,NO, +cudnn_frontend::graph::Graph::sdpa_backward,NO, +cudnn_frontend::graph::Graph::sdpa_fp8,NO, +cudnn_frontend::graph::Graph::sdpa_fp8_backward,NO, +cudnn_frontend::graph::Graph::select_behavior_notes,NO, +cudnn_frontend::graph::Graph::select_numeric_notes,NO, +cudnn_frontend::graph::Graph::serialize,NO, +cudnn_frontend::graph::Graph::set_compute_data_type,NO, +cudnn_frontend::graph::Graph::set_intermediate_data_type,NO, +cudnn_frontend::graph::Graph::set_io_data_type,NO, +cudnn_frontend::graph::Graph::set_name,NO, +cudnn_frontend::graph::Graph::set_uids_,NO, +cudnn_frontend::graph::Graph::tensor,NO, +cudnn_frontend::graph::Graph::tensor_like,NO, +cudnn_frontend::graph::INode::autotune,NO, +cudnn_frontend::graph::INode::build_operation_graph,NO, +cudnn_frontend::graph::INode::collect_pre_assigned_uids,NO, +cudnn_frontend::graph::INode::collect_pre_assigned_uids_,NO, +cudnn_frontend::graph::INode::create_cudnn_operations,NO, +cudnn_frontend::graph::INode::create_cudnn_tensors,NO, +cudnn_frontend::graph::INode::create_cudnn_tensors_,NO, +cudnn_frontend::graph::INode::deserialize,NO, +cudnn_frontend::graph::INode::execute,NO, +cudnn_frontend::graph::INode::execute_plan_at_index,NO, +cudnn_frontend::graph::INode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::INode::extend_tensor_map_with_pass_by_value_tensors_,NO, +cudnn_frontend::graph::INode::extend_tensor_map_with_workspace_tensors_,NO, +cudnn_frontend::graph::INode::gather_pass_by_value_tensors_,NO, +cudnn_frontend::graph::INode::gather_workspace_modifications,NO, +cudnn_frontend::graph::INode::getType,NO, +cudnn_frontend::graph::INode::get_autotune_workspace_size,NO, +cudnn_frontend::graph::INode::get_cudnn_workspace_size,NO, +cudnn_frontend::graph::INode::get_fe_workspace_size,NO, +cudnn_frontend::graph::INode::get_fe_workspace_size_node,NO, +cudnn_frontend::graph::INode::get_max_cudnn_workspace_size,NO, +cudnn_frontend::graph::INode::get_workspace_size,NO, +cudnn_frontend::graph::INode::get_workspace_size_plan_at_index,NO, +cudnn_frontend::graph::INode::key,NO, +cudnn_frontend::graph::INode::matmul,NO, +cudnn_frontend::graph::INode::matmul_fp8,NO, +cudnn_frontend::graph::INode::output_tensor,NO, +cudnn_frontend::graph::INode::pass_by_value_tensors_,NO, +cudnn_frontend::graph::INode::pointwise,NO, +cudnn_frontend::graph::INode::post_validate,NO, +cudnn_frontend::graph::INode::post_validate_node,NO, +cudnn_frontend::graph::INode::pre_validate_and_expand_node,NO, +cudnn_frontend::graph::INode::pre_validate_node,NO, +cudnn_frontend::graph::INode::reduction,NO, +cudnn_frontend::graph::INode::resample,NO, +cudnn_frontend::graph::INode::reshape,NO, +cudnn_frontend::graph::INode::rng,NO, +cudnn_frontend::graph::INode::run_auxiliary_kernels,NO, +cudnn_frontend::graph::INode::serialize,NO, +cudnn_frontend::graph::INode::set_uids,NO, +cudnn_frontend::graph::INode::set_uids_,NO, +cudnn_frontend::graph::INode::softmax,NO, +cudnn_frontend::graph::INode::validate,NO, +cudnn_frontend::graph::INode::workspace_modifications_tensors_,NO, +cudnn_frontend::graph::InstanceNormNode::create_cudnn_operations,NO, +cudnn_frontend::graph::InstanceNormNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::InstanceNormNode::getType,NO, +cudnn_frontend::graph::InstanceNormNode::post_validate_node,NO, +cudnn_frontend::graph::InstanceNormNode::pre_validate_node,NO, +cudnn_frontend::graph::InstanceNormNode::serialize,NO, +cudnn_frontend::graph::Instancenorm_attributes::set_epsilon,NO, +cudnn_frontend::graph::Instancenorm_attributes::set_forward_phase,NO, +cudnn_frontend::graph::Instancenorm_backward_attributes::set_saved_mean_and_inv_variance,NO, +cudnn_frontend::graph::LayerNormNode::create_cudnn_operations,NO, +cudnn_frontend::graph::LayerNormNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::LayerNormNode::getType,NO, +cudnn_frontend::graph::LayerNormNode::post_validate_node,NO, +cudnn_frontend::graph::LayerNormNode::pre_validate_node,NO, +cudnn_frontend::graph::LayerNormNode::serialize,NO, +cudnn_frontend::graph::Layernorm_attributes::set_epsilon,NO, +cudnn_frontend::graph::Layernorm_attributes::set_forward_phase,NO, +cudnn_frontend::graph::Layernorm_backward_attributes::set_saved_mean_and_inv_variance,NO, +cudnn_frontend::graph::MatmulFP8Node::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::MatmulFP8Node::getType,NO, +cudnn_frontend::graph::MatmulFP8Node::post_validate_node,NO, +cudnn_frontend::graph::MatmulFP8Node::pre_validate_node,NO, +cudnn_frontend::graph::MatmulFP8Node::serialize,NO, +cudnn_frontend::graph::MatmulNode::create_cudnn_operations,NO, +cudnn_frontend::graph::MatmulNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::MatmulNode::getType,NO, +cudnn_frontend::graph::MatmulNode::post_validate_node,NO, +cudnn_frontend::graph::MatmulNode::pre_validate_node,NO, +cudnn_frontend::graph::MatmulNode::serialize,NO, +cudnn_frontend::graph::Matmul_attributes::set_k_override,NO, +cudnn_frontend::graph::Matmul_attributes::set_m_override,NO, +cudnn_frontend::graph::Matmul_attributes::set_n_override,NO, +cudnn_frontend::graph::Matmul_attributes::set_padding,NO, +cudnn_frontend::graph::Matmul_fp8_attributes::set_padding,NO, +cudnn_frontend::graph::NodeCRTP::collect_pre_assigned_uids_,NO, +cudnn_frontend::graph::NodeCRTP::create_cudnn_tensors_,NO, +cudnn_frontend::graph::NodeCRTP::pass_by_value_tensors_,NO, +cudnn_frontend::graph::NodeCRTP::self,NO, +cudnn_frontend::graph::NodeCRTP::set_uids_,NO, +cudnn_frontend::graph::PointwiseNode::create_cudnn_operations,NO, +cudnn_frontend::graph::PointwiseNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::PointwiseNode::getType,NO, +cudnn_frontend::graph::PointwiseNode::post_validate_node,NO, +cudnn_frontend::graph::PointwiseNode::pre_validate_node,NO, +cudnn_frontend::graph::PointwiseNode::serialize,NO, +cudnn_frontend::graph::Pointwise_attributes::get_axis,NO, +cudnn_frontend::graph::Pointwise_attributes::set_axis,NO, +cudnn_frontend::graph::Pointwise_attributes::set_mode,NO, +cudnn_frontend::graph::Pointwise_attributes::set_relu_lower_clip,NO, +cudnn_frontend::graph::Pointwise_attributes::set_relu_lower_clip_slope,NO, +cudnn_frontend::graph::Pointwise_attributes::set_relu_upper_clip,NO, +cudnn_frontend::graph::RMSNormNode::create_cudnn_operations,NO, +cudnn_frontend::graph::RMSNormNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::RMSNormNode::getType,NO, +cudnn_frontend::graph::RMSNormNode::post_validate_node,NO, +cudnn_frontend::graph::RMSNormNode::pre_validate_node,NO, +cudnn_frontend::graph::RMSNormNode::serialize,NO, +cudnn_frontend::graph::ReductionNode::create_cudnn_operations,NO, +cudnn_frontend::graph::ReductionNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::ReductionNode::getType,NO, +cudnn_frontend::graph::ReductionNode::post_validate_node,NO, +cudnn_frontend::graph::ReductionNode::pre_validate_node,NO, +cudnn_frontend::graph::ReductionNode::serialize,NO, +cudnn_frontend::graph::Reduction_attributes::get_mode,NO, +cudnn_frontend::graph::Reduction_attributes::set_mode,NO, +cudnn_frontend::graph::ResampleNode::create_cudnn_operations,NO, +cudnn_frontend::graph::ResampleNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::ResampleNode::getType,NO, +cudnn_frontend::graph::ResampleNode::post_validate_node,NO, +cudnn_frontend::graph::ResampleNode::pre_validate_node,NO, +cudnn_frontend::graph::ResampleNode::serialize,NO, +cudnn_frontend::graph::Resample_attributes::set_is_inference,NO, +cudnn_frontend::graph::Resample_attributes::set_padding_mode,NO, +cudnn_frontend::graph::Resample_attributes::set_post_padding,NO, +cudnn_frontend::graph::Resample_attributes::set_pre_padding,NO, +cudnn_frontend::graph::Resample_attributes::set_resampling_mode,NO, +cudnn_frontend::graph::Resample_attributes::set_stride,NO, +cudnn_frontend::graph::Resample_attributes::set_window,NO, +cudnn_frontend::graph::ReshapeNode::create_cudnn_operations,NO, +cudnn_frontend::graph::ReshapeNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::ReshapeNode::getType,NO, +cudnn_frontend::graph::ReshapeNode::post_validate_node,NO, +cudnn_frontend::graph::ReshapeNode::pre_validate_node,NO, +cudnn_frontend::graph::ReshapeNode::serialize,NO, +cudnn_frontend::graph::Reshape_attributes::get_dim,NO, +cudnn_frontend::graph::Reshape_attributes::get_stride,NO, +cudnn_frontend::graph::Reshape_attributes::set_dim,NO, +cudnn_frontend::graph::Reshape_attributes::set_stride,NO, +cudnn_frontend::graph::Rmsnorm_attributes::set_bias,NO, +cudnn_frontend::graph::Rmsnorm_attributes::set_epsilon,NO, +cudnn_frontend::graph::Rmsnorm_attributes::set_forward_phase,NO, +cudnn_frontend::graph::Rmsnorm_backward_attributes::has_dbias,NO, +cudnn_frontend::graph::RngNode::create_cudnn_operations,NO, +cudnn_frontend::graph::RngNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::RngNode::getType,NO, +cudnn_frontend::graph::RngNode::post_validate_node,NO, +cudnn_frontend::graph::RngNode::pre_validate_node,NO, +cudnn_frontend::graph::RngNode::serialize,NO, +cudnn_frontend::graph::Rng_attributes::get_bernoulli_probability,NO, +cudnn_frontend::graph::Rng_attributes::get_dim,NO, +cudnn_frontend::graph::Rng_attributes::get_distribution,NO, +cudnn_frontend::graph::Rng_attributes::get_seed,NO, +cudnn_frontend::graph::Rng_attributes::get_stride,NO, +cudnn_frontend::graph::Rng_attributes::set_bernoulli_probability,NO, +cudnn_frontend::graph::Rng_attributes::set_dim,NO, +cudnn_frontend::graph::Rng_attributes::set_distribution,NO, +cudnn_frontend::graph::Rng_attributes::set_seed,NO, +cudnn_frontend::graph::Rng_attributes::set_stride,NO, +cudnn_frontend::graph::SDPABackwardNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::SDPABackwardNode::getType,NO, +cudnn_frontend::graph::SDPABackwardNode::get_fe_workspace_size_node,NO, +cudnn_frontend::graph::SDPABackwardNode::post_validate_node,NO, +cudnn_frontend::graph::SDPABackwardNode::pre_validate_node,NO, +cudnn_frontend::graph::SDPABackwardNode::serialize,NO, +cudnn_frontend::graph::SDPABackwardNode::workspace_modifications_tensors_,NO, +cudnn_frontend::graph::SDPAFP8BackwardNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::SDPAFP8BackwardNode::getType,NO, +cudnn_frontend::graph::SDPAFP8BackwardNode::post_validate_node,NO, +cudnn_frontend::graph::SDPAFP8BackwardNode::pre_validate_node,NO, +cudnn_frontend::graph::SDPAFP8BackwardNode::serialize,NO, +cudnn_frontend::graph::SDPAFP8Node::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::SDPAFP8Node::getType,NO, +cudnn_frontend::graph::SDPAFP8Node::post_validate_node,NO, +cudnn_frontend::graph::SDPAFP8Node::pre_validate_node,NO, +cudnn_frontend::graph::SDPAFP8Node::serialize,NO, +cudnn_frontend::graph::SDPANode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::SDPANode::getType,NO, +cudnn_frontend::graph::SDPANode::get_fe_workspace_size_node,NO, +cudnn_frontend::graph::SDPANode::post_validate_node,NO, +cudnn_frontend::graph::SDPANode::pre_validate_node,NO, +cudnn_frontend::graph::SDPANode::serialize,NO, +cudnn_frontend::graph::SDPANode::workspace_modifications_tensors_,NO, +cudnn_frontend::graph::SDPA_attributes::set_alibi_mask,NO, +cudnn_frontend::graph::SDPA_attributes::set_attn_scale,NO, +cudnn_frontend::graph::SDPA_attributes::set_bias,NO, +cudnn_frontend::graph::SDPA_attributes::set_causal_mask,NO, +cudnn_frontend::graph::SDPA_attributes::set_causal_mask_bottom_right,NO, +cudnn_frontend::graph::SDPA_attributes::set_dropout,NO, +cudnn_frontend::graph::SDPA_attributes::set_is_inference,NO, +cudnn_frontend::graph::SDPA_attributes::set_padding_mask,NO, +cudnn_frontend::graph::SDPA_attributes::set_rng_dump,NO, +cudnn_frontend::graph::SDPA_attributes::set_seq_len_kv,NO, +cudnn_frontend::graph::SDPA_attributes::set_seq_len_q,NO, +cudnn_frontend::graph::SDPA_attributes::set_sliding_window_length,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_alibi_mask,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_attn_scale,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_bias,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_causal_mask,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_causal_mask_bottom_right,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_dbias,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_deterministic_algorithm,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_dropout,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_padding_mask,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_rng_dump,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_seq_len_kv,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_seq_len_q,NO, +cudnn_frontend::graph::SDPA_backward_attributes::set_sliding_window_length,NO, +cudnn_frontend::graph::SDPA_fp8_attributes::set_attn_scale,NO, +cudnn_frontend::graph::SDPA_fp8_attributes::set_causal_mask,NO, +cudnn_frontend::graph::SDPA_fp8_attributes::set_is_inference,NO, +cudnn_frontend::graph::SDPA_fp8_backward_attributes::set_attn_scale,NO, +cudnn_frontend::graph::SDPA_fp8_backward_attributes::set_causal_mask,NO, +cudnn_frontend::graph::SoftmaxNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::SoftmaxNode::getType,NO, +cudnn_frontend::graph::SoftmaxNode::post_validate_node,NO, +cudnn_frontend::graph::SoftmaxNode::pre_validate_node,NO, +cudnn_frontend::graph::SoftmaxNode::serialize,NO, +cudnn_frontend::graph::Softmax_attributes::has_M_Zinv,NO, +cudnn_frontend::graph::Softmax_attributes::has_stats,NO, +cudnn_frontend::graph::Tensor_attributes::clear_uid,NO, +cudnn_frontend::graph::Tensor_attributes::fill_from_context,NO, +cudnn_frontend::graph::Tensor_attributes::get_data_type,NO, +cudnn_frontend::graph::Tensor_attributes::get_dim,NO, +cudnn_frontend::graph::Tensor_attributes::get_is_pass_by_value,NO, +cudnn_frontend::graph::Tensor_attributes::get_is_virtual,NO, +cudnn_frontend::graph::Tensor_attributes::get_name,NO, +cudnn_frontend::graph::Tensor_attributes::get_pass_by_value,NO, +cudnn_frontend::graph::Tensor_attributes::get_ragged_offset,NO, +cudnn_frontend::graph::Tensor_attributes::get_reordering_type,NO, +cudnn_frontend::graph::Tensor_attributes::get_stride,NO, +cudnn_frontend::graph::Tensor_attributes::get_uid,NO, +cudnn_frontend::graph::Tensor_attributes::has_uid,NO, +cudnn_frontend::graph::Tensor_attributes::set_data_type,NO, +cudnn_frontend::graph::Tensor_attributes::set_dim,NO, +cudnn_frontend::graph::Tensor_attributes::set_is_pass_by_value,NO, +cudnn_frontend::graph::Tensor_attributes::set_is_virtual,NO, +cudnn_frontend::graph::Tensor_attributes::set_name,NO, +cudnn_frontend::graph::Tensor_attributes::set_output,NO, +cudnn_frontend::graph::Tensor_attributes::set_ragged_offset,NO, +cudnn_frontend::graph::Tensor_attributes::set_reordering_type,NO, +cudnn_frontend::graph::Tensor_attributes::set_stride,NO, +cudnn_frontend::graph::Tensor_attributes::set_uid,NO, +cudnn_frontend::graph::Tensor_attributes::validate,NO, +cudnn_frontend::graph::WgradNode::create_cudnn_operations,NO, +cudnn_frontend::graph::WgradNode::expand_and_infer_properties_node,NO, +cudnn_frontend::graph::WgradNode::getType,NO, +cudnn_frontend::graph::WgradNode::post_validate_node,NO, +cudnn_frontend::graph::WgradNode::pre_validate_node,NO, +cudnn_frontend::graph::WgradNode::serialize,NO, diff --git a/docs/dev_guide/api-mapping-status/nvSHMEM_API_migration_status.csv b/docs/dev_guide/api-mapping-status/nvSHMEM_API_migration_status.csv index d62439bb3bef..4747ae597daa 100644 --- a/docs/dev_guide/api-mapping-status/nvSHMEM_API_migration_status.csv +++ b/docs/dev_guide/api-mapping-status/nvSHMEM_API_migration_status.csv @@ -32,740 +32,740 @@ nvshmem_team_translate_pe,YES, nvshmem_team_split_strided,YES, nvshmem_team_split_2d,YES, nvshmem_team_destroy,YES, -nvshmem_float_put,NO, -nvshmem_double_put,NO, -nvshmem_char_put,NO, -nvshmem_schar_put,NO, -nvshmem_short_put,NO, -nvshmem_int_put,NO, -nvshmem_long_put,NO, -nvshmem_longlong_put,NO, -nvshmem_uchar_put,NO, -nvshmem_ushort_put,NO, -nvshmem_uint_put,NO, -nvshmem_ulong_put,NO, -nvshmem_ulonglong_put,NO, -nvshmem_int8_put,NO, -nvshmem_int16_put,NO, -nvshmem_int32_put,NO, -nvshmem_int64_put,NO, -nvshmem_uint8_put,NO, -nvshmem_uint16_put,NO, -nvshmem_uint32_put,NO, -nvshmem_uint64_put,NO, -nvshmem_size_put,NO, -nvshmem_ptrdiff_put,NO, -nvshmemx_float_put_on_stream,NO, -nvshmemx_double_put_on_stream,NO, -nvshmemx_char_put_on_stream,NO, -nvshmemx_schar_put_on_stream,NO, -nvshmemx_short_put_on_stream,NO, -nvshmemx_int_put_on_stream,NO, -nvshmemx_long_put_on_stream,NO, -nvshmemx_longlong_put_on_stream,NO, -nvshmemx_uchar_put_on_stream,NO, -nvshmemx_ushort_put_on_stream,NO, -nvshmemx_uint_put_on_stream,NO, -nvshmemx_ulong_put_on_stream,NO, -nvshmemx_ulonglong_put_on_stream,NO, -nvshmemx_int8_put_on_stream,NO, -nvshmemx_int16_put_on_stream,NO, -nvshmemx_int32_put_on_stream,NO, -nvshmemx_int64_put_on_stream,NO, -nvshmemx_uint8_put_on_stream,NO, -nvshmemx_uint16_put_on_stream,NO, -nvshmemx_uint32_put_on_stream,NO, -nvshmemx_uint64_put_on_stream,NO, -nvshmemx_size_put_on_stream,NO, -nvshmemx_ptrdiff_put_on_stream,NO, -nvshmemx_float_put_block,NO, -nvshmemx_double_put_block,NO, -nvshmemx_char_put_block,NO, -nvshmemx_schar_put_block,NO, -nvshmemx_short_put_block,NO, -nvshmemx_int_put_block,NO, -nvshmemx_long_put_block,NO, -nvshmemx_longlong_put_block,NO, -nvshmemx_uchar_put_block,NO, -nvshmemx_ushort_put_block,NO, -nvshmemx_uint_put_block,NO, -nvshmemx_ulong_put_block,NO, -nvshmemx_ulonglong_put_block,NO, -nvshmemx_int8_put_block,NO, -nvshmemx_int16_put_block,NO, -nvshmemx_int32_put_block,NO, -nvshmemx_int64_put_block,NO, -nvshmemx_uint8_put_block,NO, -nvshmemx_uint16_put_block,NO, -nvshmemx_uint32_put_block,NO, -nvshmemx_uint64_put_block,NO, -nvshmemx_size_put_block,NO, -nvshmemx_ptrdiff_put_block,NO, -nvshmemx_float_put_warp,NO, -nvshmemx_double_put_warp,NO, -nvshmemx_char_put_warp,NO, -nvshmemx_schar_put_warp,NO, -nvshmemx_short_put_warp,NO, -nvshmemx_int_put_warp,NO, -nvshmemx_long_put_warp,NO, -nvshmemx_longlong_put_warp,NO, -nvshmemx_uchar_put_warp,NO, -nvshmemx_ushort_put_warp,NO, -nvshmemx_uint_put_warp,NO, -nvshmemx_ulong_put_warp,NO, -nvshmemx_ulonglong_put_warp,NO, -nvshmemx_int8_put_warp,NO, -nvshmemx_int16_put_warp,NO, -nvshmemx_int32_put_warp,NO, -nvshmemx_int64_put_warp,NO, -nvshmemx_uint8_put_warp,NO, -nvshmemx_uint16_put_warp,NO, -nvshmemx_uint32_put_warp,NO, -nvshmemx_uint64_put_warp,NO, -nvshmemx_size_put_warp,NO, -nvshmemx_ptrdiff_put_warp,NO, -nvshmem_put8,NO, -nvshmem_put16,NO, -nvshmem_put32,NO, -nvshmem_put64,NO, -nvshmem_put128,NO, -nvshmemx_put8_on_stream,NO, -nvshmemx_put16_on_stream,NO, -nvshmemx_put32_on_stream,NO, -nvshmemx_put64_on_stream,NO, -nvshmemx_put128_on_stream,NO, -nvshmemx_put8_block,NO, -nvshmemx_put16_block,NO, -nvshmemx_put32_block,NO, -nvshmemx_put64_block,NO, -nvshmemx_put128_block,NO, -nvshmemx_put8_warp,NO, -nvshmemx_put16_warp,NO, -nvshmemx_put32_warp,NO, -nvshmemx_put64_warp,NO, -nvshmemx_put128_warp,NO, -nvshmem_putmem,NO, -nvshmemx_putmem_on_stream,NO, -nvshmemx_putmem_block,NO, -nvshmemx_putmem_warp,NO, -nvshmem_float_p,NO, -nvshmem_double_p,NO, -nvshmem_char_p,NO, -nvshmem_schar_p,NO, -nvshmem_short_p,NO, -nvshmem_int_p,NO, -nvshmem_long_p,NO, -nvshmem_longlong_p,NO, -nvshmem_uchar_p,NO, -nvshmem_ushort_p,NO, -nvshmem_uint_p,NO, -nvshmem_ulong_p,NO, -nvshmem_ulonglong_p,NO, -nvshmem_int8_p,NO, -nvshmem_int16_p,NO, -nvshmem_int32_p,NO, -nvshmem_int64_p,NO, -nvshmem_uint8_p,NO, -nvshmem_uint16_p,NO, -nvshmem_uint32_p,NO, -nvshmem_uint64_p,NO, -nvshmem_size_p,NO, -nvshmem_ptrdiff_p,NO, -nvshmem_float_iput,NO, -nvshmem_double_iput,NO, -nvshmem_char_iput,NO, -nvshmem_schar_iput,NO, -nvshmem_short_iput,NO, -nvshmem_int_iput,NO, -nvshmem_long_iput,NO, -nvshmem_longlong_iput,NO, -nvshmem_uchar_iput,NO, -nvshmem_ushort_iput,NO, -nvshmem_uint_iput,NO, -nvshmem_ulong_iput,NO, -nvshmem_ulonglong_iput,NO, -nvshmem_int8_iput,NO, -nvshmem_int16_iput,NO, -nvshmem_int32_iput,NO, -nvshmem_int64_iput,NO, -nvshmem_uint8_iput,NO, -nvshmem_uint16_iput,NO, -nvshmem_uint32_iput,NO, -nvshmem_uint64_iput,NO, -nvshmem_size_iput,NO, -nvshmem_ptrdiff_iput,NO, -nvshmemx_float_iput_on_stream,NO, -nvshmemx_double_iput_on_stream,NO, -nvshmemx_char_iput_on_stream,NO, -nvshmemx_schar_iput_on_stream,NO, -nvshmemx_short_iput_on_stream,NO, -nvshmemx_int_iput_on_stream,NO, -nvshmemx_long_iput_on_stream,NO, -nvshmemx_longlong_iput_on_stream,NO, -nvshmemx_uchar_iput_on_stream,NO, -nvshmemx_ushort_iput_on_stream,NO, -nvshmemx_uint_iput_on_stream,NO, -nvshmemx_ulong_iput_on_stream,NO, -nvshmemx_ulonglong_iput_on_stream,NO, -nvshmemx_int8_iput_on_stream,NO, -nvshmemx_int16_iput_on_stream,NO, -nvshmemx_int32_iput_on_stream,NO, -nvshmemx_int64_iput_on_stream,NO, -nvshmemx_uint8_iput_on_stream,NO, -nvshmemx_uint16_iput_on_stream,NO, -nvshmemx_uint32_iput_on_stream,NO, -nvshmemx_uint64_iput_on_stream,NO, -nvshmemx_size_iput_on_stream,NO, -nvshmemx_ptrdiff_iput_on_stream,NO, -nvshmemx_float_iput_block,NO, -nvshmemx_double_iput_block,NO, -nvshmemx_char_iput_block,NO, -nvshmemx_schar_iput_block,NO, -nvshmemx_short_iput_block,NO, -nvshmemx_int_iput_block,NO, -nvshmemx_long_iput_block,NO, -nvshmemx_longlong_iput_block,NO, -nvshmemx_uchar_iput_block,NO, -nvshmemx_ushort_iput_block,NO, -nvshmemx_uint_iput_block,NO, -nvshmemx_ulong_iput_block,NO, -nvshmemx_ulonglong_iput_block,NO, -nvshmemx_int8_iput_block,NO, -nvshmemx_int16_iput_block,NO, -nvshmemx_int32_iput_block,NO, -nvshmemx_int64_iput_block,NO, -nvshmemx_uint8_iput_block,NO, -nvshmemx_uint16_iput_block,NO, -nvshmemx_uint32_iput_block,NO, -nvshmemx_uint64_iput_block,NO, -nvshmemx_size_iput_block,NO, -nvshmemx_ptrdiff_iput_block,NO, -nvshmemx_float_iput_warp,NO, -nvshmemx_double_iput_warp,NO, -nvshmemx_char_iput_warp,NO, -nvshmemx_schar_iput_warp,NO, -nvshmemx_short_iput_warp,NO, -nvshmemx_int_iput_warp,NO, -nvshmemx_long_iput_warp,NO, -nvshmemx_longlong_iput_warp,NO, -nvshmemx_uchar_iput_warp,NO, -nvshmemx_ushort_iput_warp,NO, -nvshmemx_uint_iput_warp,NO, -nvshmemx_ulong_iput_warp,NO, -nvshmemx_ulonglong_iput_warp,NO, -nvshmemx_int8_iput_warp,NO, -nvshmemx_int16_iput_warp,NO, -nvshmemx_int32_iput_warp,NO, -nvshmemx_int64_iput_warp,NO, -nvshmemx_uint8_iput_warp,NO, -nvshmemx_uint16_iput_warp,NO, -nvshmemx_uint32_iput_warp,NO, -nvshmemx_uint64_iput_warp,NO, -nvshmemx_size_iput_warp,NO, -nvshmemx_ptrdiff_iput_warp,NO, -nvshmem_iput8,NO, -nvshmem_iput16,NO, -nvshmem_iput32,NO, -nvshmem_iput64,NO, -nvshmem_iput128,NO, -nvshmemx_iput8_on_stream,NO, -nvshmemx_iput16_on_stream,NO, -nvshmemx_iput32_on_stream,NO, -nvshmemx_iput64_on_stream,NO, -nvshmemx_iput128_on_stream,NO, -nvshmemx_iput8_block,NO, -nvshmemx_iput16_block,NO, -nvshmemx_iput32_block,NO, -nvshmemx_iput64_block,NO, -nvshmemx_iput128_block,NO, -nvshmemx_iput8_warp,NO, -nvshmemx_iput16_warp,NO, -nvshmemx_iput32_warp,NO, -nvshmemx_iput64_warp,NO, -nvshmemx_iput128_warp,NO, -nvshmem_float_get,NO, -nvshmem_double_get,NO, -nvshmem_char_get,NO, -nvshmem_schar_get,NO, -nvshmem_short_get,NO, -nvshmem_int_get,NO, -nvshmem_long_get,NO, -nvshmem_longlong_get,NO, -nvshmem_uchar_get,NO, -nvshmem_ushort_get,NO, -nvshmem_uint_get,NO, -nvshmem_ulong_get,NO, -nvshmem_ulonglong_get,NO, -nvshmem_int8_get,NO, -nvshmem_int16_get,NO, -nvshmem_int32_get,NO, -nvshmem_int64_get,NO, -nvshmem_uint8_get,NO, -nvshmem_uint16_get,NO, -nvshmem_uint32_get,NO, -nvshmem_uint64_get,NO, -nvshmem_size_get,NO, -nvshmem_ptrdiff_get,NO, -nvshmemx_float_get_on_stream,NO, -nvshmemx_double_get_on_stream,NO, -nvshmemx_char_get_on_stream,NO, -nvshmemx_schar_get_on_stream,NO, -nvshmemx_short_get_on_stream,NO, -nvshmemx_int_get_on_stream,NO, -nvshmemx_long_get_on_stream,NO, -nvshmemx_longlong_get_on_stream,NO, -nvshmemx_uchar_get_on_stream,NO, -nvshmemx_ushort_get_on_stream,NO, -nvshmemx_uint_get_on_stream,NO, -nvshmemx_ulong_get_on_stream,NO, -nvshmemx_ulonglong_get_on_stream,NO, -nvshmemx_int8_get_on_stream,NO, -nvshmemx_int16_get_on_stream,NO, -nvshmemx_int32_get_on_stream,NO, -nvshmemx_int64_get_on_stream,NO, -nvshmemx_uint8_get_on_stream,NO, -nvshmemx_uint16_get_on_stream,NO, -nvshmemx_uint32_get_on_stream,NO, -nvshmemx_uint64_get_on_stream,NO, -nvshmemx_size_get_on_stream,NO, -nvshmemx_ptrdiff_get_on_stream,NO, -nvshmemx_float_get_block,NO, -nvshmemx_double_get_block,NO, -nvshmemx_char_get_block,NO, -nvshmemx_schar_get_block,NO, -nvshmemx_short_get_block,NO, -nvshmemx_int_get_block,NO, -nvshmemx_long_get_block,NO, -nvshmemx_longlong_get_block,NO, -nvshmemx_uchar_get_block,NO, -nvshmemx_ushort_get_block,NO, -nvshmemx_uint_get_block,NO, -nvshmemx_ulong_get_block,NO, -nvshmemx_ulonglong_get_block,NO, -nvshmemx_int8_get_block,NO, -nvshmemx_int16_get_block,NO, -nvshmemx_int32_get_block,NO, -nvshmemx_int64_get_block,NO, -nvshmemx_uint8_get_block,NO, -nvshmemx_uint16_get_block,NO, -nvshmemx_uint32_get_block,NO, -nvshmemx_uint64_get_block,NO, -nvshmemx_size_get_block,NO, -nvshmemx_ptrdiff_get_block,NO, -nvshmemx_float_get_warp,NO, -nvshmemx_double_get_warp,NO, -nvshmemx_char_get_warp,NO, -nvshmemx_schar_get_warp,NO, -nvshmemx_short_get_warp,NO, -nvshmemx_int_get_warp,NO, -nvshmemx_long_get_warp,NO, -nvshmemx_longlong_get_warp,NO, -nvshmemx_uchar_get_warp,NO, -nvshmemx_ushort_get_warp,NO, -nvshmemx_uint_get_warp,NO, -nvshmemx_ulong_get_warp,NO, -nvshmemx_ulonglong_get_warp,NO, -nvshmemx_int8_get_warp,NO, -nvshmemx_int16_get_warp,NO, -nvshmemx_int32_get_warp,NO, -nvshmemx_int64_get_warp,NO, -nvshmemx_uint8_get_warp,NO, -nvshmemx_uint16_get_warp,NO, -nvshmemx_uint32_get_warp,NO, -nvshmemx_uint64_get_warp,NO, -nvshmemx_size_get_warp,NO, -nvshmemx_ptrdiff_get_warp,NO, -nvshmem_get8,NO, -nvshmem_get16,NO, -nvshmem_get32,NO, -nvshmem_get64,NO, -nvshmem_get128,NO, -nvshmemx_get8_on_stream,NO, -nvshmemx_get16_on_stream,NO, -nvshmemx_get32_on_stream,NO, -nvshmemx_get64_on_stream,NO, -nvshmemx_get128_on_stream,NO, -nvshmemx_get8_block,NO, -nvshmemx_get16_block,NO, -nvshmemx_get32_block,NO, -nvshmemx_get64_block,NO, -nvshmemx_get128_block,NO, -nvshmemx_get8_warp,NO, -nvshmemx_get16_warp,NO, -nvshmemx_get32_warp,NO, -nvshmemx_get64_warp,NO, -nvshmemx_get128_warp,NO, -nvshmem_getmem,NO, -nvshmemx_getmem_on_stream,NO, -nvshmemx_getmem_block,NO, -nvshmemx_getmem_warp,NO, -nvshmem_float_g,NO, -nvshmem_double_g,NO, -nvshmem_char_g,NO, -nvshmem_schar_g,NO, -nvshmem_short_g,NO, -nvshmem_int_g,NO, -nvshmem_long_g,NO, -nvshmem_longlong_g,NO, -nvshmem_uchar_g,NO, -nvshmem_ushort_g,NO, -nvshmem_uint_g,NO, -nvshmem_ulong_g,NO, -nvshmem_ulonglong_g,NO, -nvshmem_int8_g,NO, -nvshmem_int16_g,NO, -nvshmem_int32_g,NO, -nvshmem_int64_g,NO, -nvshmem_uint8_g,NO, -nvshmem_uint16_g,NO, -nvshmem_uint32_g,NO, -nvshmem_uint64_g,NO, -nvshmem_size_g,NO, -nvshmem_ptrdiff_g,NO, -nvshmem_float_iget,NO, -nvshmem_double_iget,NO, -nvshmem_char_iget,NO, -nvshmem_schar_iget,NO, -nvshmem_short_iget,NO, -nvshmem_int_iget,NO, -nvshmem_long_iget,NO, -nvshmem_longlong_iget,NO, -nvshmem_uchar_iget,NO, -nvshmem_ushort_iget,NO, -nvshmem_uint_iget,NO, -nvshmem_ulong_iget,NO, -nvshmem_ulonglong_iget,NO, -nvshmem_int8_iget,NO, -nvshmem_int16_iget,NO, -nvshmem_int32_iget,NO, -nvshmem_int64_iget,NO, -nvshmem_uint8_iget,NO, -nvshmem_uint16_iget,NO, -nvshmem_uint32_iget,NO, -nvshmem_uint64_iget,NO, -nvshmem_size_iget,NO, -nvshmem_ptrdiff_iget,NO, -nvshmemx_float_iget_on_stream,NO, -nvshmemx_double_iget_on_stream,NO, -nvshmemx_char_iget_on_stream,NO, -nvshmemx_schar_iget_on_stream,NO, -nvshmemx_short_iget_on_stream,NO, -nvshmemx_int_iget_on_stream,NO, -nvshmemx_long_iget_on_stream,NO, -nvshmemx_longlong_iget_on_stream,NO, -nvshmemx_uchar_iget_on_stream,NO, -nvshmemx_ushort_iget_on_stream,NO, -nvshmemx_uint_iget_on_stream,NO, -nvshmemx_ulong_iget_on_stream,NO, -nvshmemx_ulonglong_iget_on_stream,NO, -nvshmemx_int8_iget_on_stream,NO, -nvshmemx_int16_iget_on_stream,NO, -nvshmemx_int32_iget_on_stream,NO, -nvshmemx_int64_iget_on_stream,NO, -nvshmemx_uint8_iget_on_stream,NO, -nvshmemx_uint16_iget_on_stream,NO, -nvshmemx_uint32_iget_on_stream,NO, -nvshmemx_uint64_iget_on_stream,NO, -nvshmemx_size_iget_on_stream,NO, -nvshmemx_ptrdiff_iget_on_stream,NO, -nvshmemx_float_iget_block,NO, -nvshmemx_double_iget_block,NO, -nvshmemx_char_iget_block,NO, -nvshmemx_schar_iget_block,NO, -nvshmemx_short_iget_block,NO, -nvshmemx_int_iget_block,NO, -nvshmemx_long_iget_block,NO, -nvshmemx_longlong_iget_block,NO, -nvshmemx_uchar_iget_block,NO, -nvshmemx_ushort_iget_block,NO, -nvshmemx_uint_iget_block,NO, -nvshmemx_ulong_iget_block,NO, -nvshmemx_ulonglong_iget_block,NO, -nvshmemx_int8_iget_block,NO, -nvshmemx_int16_iget_block,NO, -nvshmemx_int32_iget_block,NO, -nvshmemx_int64_iget_block,NO, -nvshmemx_uint8_iget_block,NO, -nvshmemx_uint16_iget_block,NO, -nvshmemx_uint32_iget_block,NO, -nvshmemx_uint64_iget_block,NO, -nvshmemx_size_iget_block,NO, -nvshmemx_ptrdiff_iget_block,NO, -nvshmemx_float_iget_warp,NO, -nvshmemx_double_iget_warp,NO, -nvshmemx_char_iget_warp,NO, -nvshmemx_schar_iget_warp,NO, -nvshmemx_short_iget_warp,NO, -nvshmemx_int_iget_warp,NO, -nvshmemx_long_iget_warp,NO, -nvshmemx_longlong_iget_warp,NO, -nvshmemx_uchar_iget_warp,NO, -nvshmemx_ushort_iget_warp,NO, -nvshmemx_uint_iget_warp,NO, -nvshmemx_ulong_iget_warp,NO, -nvshmemx_ulonglong_iget_warp,NO, -nvshmemx_int8_iget_warp,NO, -nvshmemx_int16_iget_warp,NO, -nvshmemx_int32_iget_warp,NO, -nvshmemx_int64_iget_warp,NO, -nvshmemx_uint8_iget_warp,NO, -nvshmemx_uint16_iget_warp,NO, -nvshmemx_uint32_iget_warp,NO, -nvshmemx_uint64_iget_warp,NO, -nvshmemx_size_iget_warp,NO, -nvshmemx_ptrdiff_iget_warp,NO, -nvshmem_iget8,NO, -nvshmem_iget16,NO, -nvshmem_iget32,NO, -nvshmem_iget64,NO, -nvshmem_iget128,NO, -nvshmemx_iget8_on_stream,NO, -nvshmemx_iget16_on_stream,NO, -nvshmemx_iget32_on_stream,NO, -nvshmemx_iget64_on_stream,NO, -nvshmemx_iget128_on_stream,NO, -nvshmemx_iget8_block,NO, -nvshmemx_iget16_block,NO, -nvshmemx_iget32_block,NO, -nvshmemx_iget64_block,NO, -nvshmemx_iget128_block,NO, -nvshmemx_iget8_warp,NO, -nvshmemx_iget16_warp,NO, -nvshmemx_iget32_warp,NO, -nvshmemx_iget64_warp,NO, -nvshmemx_iget128_warp,NO, -nvshmem_float_put_nbi,NO, -nvshmem_double_put_nbi,NO, -nvshmem_char_put_nbi,NO, -nvshmem_schar_put_nbi,NO, -nvshmem_short_put_nbi,NO, -nvshmem_int_put_nbi,NO, -nvshmem_long_put_nbi,NO, -nvshmem_longlong_put_nbi,NO, -nvshmem_uchar_put_nbi,NO, -nvshmem_ushort_put_nbi,NO, -nvshmem_uint_put_nbi,NO, -nvshmem_ulong_put_nbi,NO, -nvshmem_ulonglong_put_nbi,NO, -nvshmem_int8_put_nbi,NO, -nvshmem_int16_put_nbi,NO, -nvshmem_int32_put_nbi,NO, -nvshmem_int64_put_nbi,NO, -nvshmem_uint8_put_nbi,NO, -nvshmem_uint16_put_nbi,NO, -nvshmem_uint32_put_nbi,NO, -nvshmem_uint64_put_nbi,NO, -nvshmem_size_put_nbi,NO, -nvshmem_ptrdiff_put_nbi,NO, -nvshmemx_float_put_nbi_on_stream,NO, -nvshmemx_double_put_nbi_on_stream,NO, -nvshmemx_char_put_nbi_on_stream,NO, -nvshmemx_schar_put_nbi_on_stream,NO, -nvshmemx_short_put_nbi_on_stream,NO, -nvshmemx_int_put_nbi_on_stream,NO, -nvshmemx_long_put_nbi_on_stream,NO, -nvshmemx_longlong_put_nbi_on_stream,NO, -nvshmemx_uchar_put_nbi_on_stream,NO, -nvshmemx_ushort_put_nbi_on_stream,NO, -nvshmemx_uint_put_nbi_on_stream,NO, -nvshmemx_ulong_put_nbi_on_stream,NO, -nvshmemx_ulonglong_put_nbi_on_stream,NO, -nvshmemx_int8_put_nbi_on_stream,NO, -nvshmemx_int16_put_nbi_on_stream,NO, -nvshmemx_int32_put_nbi_on_stream,NO, -nvshmemx_int64_put_nbi_on_stream,NO, -nvshmemx_uint8_put_nbi_on_stream,NO, -nvshmemx_uint16_put_nbi_on_stream,NO, -nvshmemx_uint32_put_nbi_on_stream,NO, -nvshmemx_uint64_put_nbi_on_stream,NO, -nvshmemx_size_put_nbi_on_stream,NO, -nvshmemx_ptrdiff_put_nbi_on_stream,NO, -nvshmemx_float_put_nbi_block,NO, -nvshmemx_double_put_nbi_block,NO, -nvshmemx_char_put_nbi_block,NO, -nvshmemx_schar_put_nbi_block,NO, -nvshmemx_short_put_nbi_block,NO, -nvshmemx_int_put_nbi_block,NO, -nvshmemx_long_put_nbi_block,NO, -nvshmemx_longlong_put_nbi_block,NO, -nvshmemx_uchar_put_nbi_block,NO, -nvshmemx_ushort_put_nbi_block,NO, -nvshmemx_uint_put_nbi_block,NO, -nvshmemx_ulong_put_nbi_block,NO, -nvshmemx_ulonglong_put_nbi_block,NO, -nvshmemx_int8_put_nbi_block,NO, -nvshmemx_int16_put_nbi_block,NO, -nvshmemx_int32_put_nbi_block,NO, -nvshmemx_int64_put_nbi_block,NO, -nvshmemx_uint8_put_nbi_block,NO, -nvshmemx_uint16_put_nbi_block,NO, -nvshmemx_uint32_put_nbi_block,NO, -nvshmemx_uint64_put_nbi_block,NO, -nvshmemx_size_put_nbi_block,NO, -nvshmemx_ptrdiff_put_nbi_block,NO, -nvshmemx_float_put_nbi_warp,NO, -nvshmemx_double_put_nbi_warp,NO, -nvshmemx_char_put_nbi_warp,NO, -nvshmemx_schar_put_nbi_warp,NO, -nvshmemx_short_put_nbi_warp,NO, -nvshmemx_int_put_nbi_warp,NO, -nvshmemx_long_put_nbi_warp,NO, -nvshmemx_longlong_put_nbi_warp,NO, -nvshmemx_uchar_put_nbi_warp,NO, -nvshmemx_ushort_put_nbi_warp,NO, -nvshmemx_uint_put_nbi_warp,NO, -nvshmemx_ulong_put_nbi_warp,NO, -nvshmemx_ulonglong_put_nbi_warp,NO, -nvshmemx_int8_put_nbi_warp,NO, -nvshmemx_int16_put_nbi_warp,NO, -nvshmemx_int32_put_nbi_warp,NO, -nvshmemx_int64_put_nbi_warp,NO, -nvshmemx_uint8_put_nbi_warp,NO, -nvshmemx_uint16_put_nbi_warp,NO, -nvshmemx_uint32_put_nbi_warp,NO, -nvshmemx_uint64_put_nbi_warp,NO, -nvshmemx_size_put_nbi_warp,NO, -nvshmemx_ptrdiff_put_nbi_warp,NO, -nvshmem_put8_nbi,NO, -nvshmem_put16_nbi,NO, -nvshmem_put32_nbi,NO, -nvshmem_put64_nbi,NO, -nvshmem_put128_nbi,NO, -nvshmemx_put8_nbi_on_stream,NO, -nvshmemx_put16_nbi_on_stream,NO, -nvshmemx_put32_nbi_on_stream,NO, -nvshmemx_put64_nbi_on_stream,NO, -nvshmemx_put128_nbi_on_stream,NO, -nvshmemx_put8_nbi_block,NO, -nvshmemx_put16_nbi_block,NO, -nvshmemx_put32_nbi_block,NO, -nvshmemx_put64_nbi_block,NO, -nvshmemx_put128_nbi_block,NO, -nvshmemx_put8_nbi_warp,NO, -nvshmemx_put16_nbi_warp,NO, -nvshmemx_put32_nbi_warp,NO, -nvshmemx_put64_nbi_warp,NO, -nvshmemx_put128_nbi_warp,NO, +nvshmem_float_put,YES, +nvshmem_double_put,YES, +nvshmem_char_put,YES, +nvshmem_schar_put,YES, +nvshmem_short_put,YES, +nvshmem_int_put,YES, +nvshmem_long_put,YES, +nvshmem_longlong_put,YES, +nvshmem_uchar_put,YES, +nvshmem_ushort_put,YES, +nvshmem_uint_put,YES, +nvshmem_ulong_put,YES, +nvshmem_ulonglong_put,YES, +nvshmem_int8_put,YES, +nvshmem_int16_put,YES, +nvshmem_int32_put,YES, +nvshmem_int64_put,YES, +nvshmem_uint8_put,YES, +nvshmem_uint16_put,YES, +nvshmem_uint32_put,YES, +nvshmem_uint64_put,YES, +nvshmem_size_put,YES, +nvshmem_ptrdiff_put,YES, +nvshmemx_float_put_on_stream,YES, +nvshmemx_double_put_on_stream,YES, +nvshmemx_char_put_on_stream,YES, +nvshmemx_schar_put_on_stream,YES, +nvshmemx_short_put_on_stream,YES, +nvshmemx_int_put_on_stream,YES, +nvshmemx_long_put_on_stream,YES, +nvshmemx_longlong_put_on_stream,YES, +nvshmemx_uchar_put_on_stream,YES, +nvshmemx_ushort_put_on_stream,YES, +nvshmemx_uint_put_on_stream,YES, +nvshmemx_ulong_put_on_stream,YES, +nvshmemx_ulonglong_put_on_stream,YES, +nvshmemx_int8_put_on_stream,YES, +nvshmemx_int16_put_on_stream,YES, +nvshmemx_int32_put_on_stream,YES, +nvshmemx_int64_put_on_stream,YES, +nvshmemx_uint8_put_on_stream,YES, +nvshmemx_uint16_put_on_stream,YES, +nvshmemx_uint32_put_on_stream,YES, +nvshmemx_uint64_put_on_stream,YES, +nvshmemx_size_put_on_stream,YES, +nvshmemx_ptrdiff_put_on_stream,YES, +nvshmemx_float_put_block,YES, +nvshmemx_double_put_block,YES, +nvshmemx_char_put_block,YES, +nvshmemx_schar_put_block,YES, +nvshmemx_short_put_block,YES, +nvshmemx_int_put_block,YES, +nvshmemx_long_put_block,YES, +nvshmemx_longlong_put_block,YES, +nvshmemx_uchar_put_block,YES, +nvshmemx_ushort_put_block,YES, +nvshmemx_uint_put_block,YES, +nvshmemx_ulong_put_block,YES, +nvshmemx_ulonglong_put_block,YES, +nvshmemx_int8_put_block,YES, +nvshmemx_int16_put_block,YES, +nvshmemx_int32_put_block,YES, +nvshmemx_int64_put_block,YES, +nvshmemx_uint8_put_block,YES, +nvshmemx_uint16_put_block,YES, +nvshmemx_uint32_put_block,YES, +nvshmemx_uint64_put_block,YES, +nvshmemx_size_put_block,YES, +nvshmemx_ptrdiff_put_block,YES, +nvshmemx_float_put_warp,YES, +nvshmemx_double_put_warp,YES, +nvshmemx_char_put_warp,YES, +nvshmemx_schar_put_warp,YES, +nvshmemx_short_put_warp,YES, +nvshmemx_int_put_warp,YES, +nvshmemx_long_put_warp,YES, +nvshmemx_longlong_put_warp,YES, +nvshmemx_uchar_put_warp,YES, +nvshmemx_ushort_put_warp,YES, +nvshmemx_uint_put_warp,YES, +nvshmemx_ulong_put_warp,YES, +nvshmemx_ulonglong_put_warp,YES, +nvshmemx_int8_put_warp,YES, +nvshmemx_int16_put_warp,YES, +nvshmemx_int32_put_warp,YES, +nvshmemx_int64_put_warp,YES, +nvshmemx_uint8_put_warp,YES, +nvshmemx_uint16_put_warp,YES, +nvshmemx_uint32_put_warp,YES, +nvshmemx_uint64_put_warp,YES, +nvshmemx_size_put_warp,YES, +nvshmemx_ptrdiff_put_warp,YES, +nvshmem_put8,YES, +nvshmem_put16,YES, +nvshmem_put32,YES, +nvshmem_put64,YES, +nvshmem_put128,YES, +nvshmemx_put8_on_stream,YES, +nvshmemx_put16_on_stream,YES, +nvshmemx_put32_on_stream,YES, +nvshmemx_put64_on_stream,YES, +nvshmemx_put128_on_stream,YES, +nvshmemx_put8_block,YES, +nvshmemx_put16_block,YES, +nvshmemx_put32_block,YES, +nvshmemx_put64_block,YES, +nvshmemx_put128_block,YES, +nvshmemx_put8_warp,YES, +nvshmemx_put16_warp,YES, +nvshmemx_put32_warp,YES, +nvshmemx_put64_warp,YES, +nvshmemx_put128_warp,YES, +nvshmem_putmem,YES, +nvshmemx_putmem_on_stream,YES, +nvshmemx_putmem_block,YES, +nvshmemx_putmem_warp,YES, +nvshmem_float_p,YES, +nvshmem_double_p,YES, +nvshmem_char_p,YES, +nvshmem_schar_p,YES, +nvshmem_short_p,YES, +nvshmem_int_p,YES, +nvshmem_long_p,YES, +nvshmem_longlong_p,YES, +nvshmem_uchar_p,YES, +nvshmem_ushort_p,YES, +nvshmem_uint_p,YES, +nvshmem_ulong_p,YES, +nvshmem_ulonglong_p,YES, +nvshmem_int8_p,YES, +nvshmem_int16_p,YES, +nvshmem_int32_p,YES, +nvshmem_int64_p,YES, +nvshmem_uint8_p,YES, +nvshmem_uint16_p,YES, +nvshmem_uint32_p,YES, +nvshmem_uint64_p,YES, +nvshmem_size_p,YES, +nvshmem_ptrdiff_p,YES, +nvshmem_float_iput,YES, +nvshmem_double_iput,YES, +nvshmem_char_iput,YES, +nvshmem_schar_iput,YES, +nvshmem_short_iput,YES, +nvshmem_int_iput,YES, +nvshmem_long_iput,YES, +nvshmem_longlong_iput,YES, +nvshmem_uchar_iput,YES, +nvshmem_ushort_iput,YES, +nvshmem_uint_iput,YES, +nvshmem_ulong_iput,YES, +nvshmem_ulonglong_iput,YES, +nvshmem_int8_iput,YES, +nvshmem_int16_iput,YES, +nvshmem_int32_iput,YES, +nvshmem_int64_iput,YES, +nvshmem_uint8_iput,YES, +nvshmem_uint16_iput,YES, +nvshmem_uint32_iput,YES, +nvshmem_uint64_iput,YES, +nvshmem_size_iput,YES, +nvshmem_ptrdiff_iput,YES, +nvshmemx_float_iput_on_stream,YES, +nvshmemx_double_iput_on_stream,YES, +nvshmemx_char_iput_on_stream,YES, +nvshmemx_schar_iput_on_stream,YES, +nvshmemx_short_iput_on_stream,YES, +nvshmemx_int_iput_on_stream,YES, +nvshmemx_long_iput_on_stream,YES, +nvshmemx_longlong_iput_on_stream,YES, +nvshmemx_uchar_iput_on_stream,YES, +nvshmemx_ushort_iput_on_stream,YES, +nvshmemx_uint_iput_on_stream,YES, +nvshmemx_ulong_iput_on_stream,YES, +nvshmemx_ulonglong_iput_on_stream,YES, +nvshmemx_int8_iput_on_stream,YES, +nvshmemx_int16_iput_on_stream,YES, +nvshmemx_int32_iput_on_stream,YES, +nvshmemx_int64_iput_on_stream,YES, +nvshmemx_uint8_iput_on_stream,YES, +nvshmemx_uint16_iput_on_stream,YES, +nvshmemx_uint32_iput_on_stream,YES, +nvshmemx_uint64_iput_on_stream,YES, +nvshmemx_size_iput_on_stream,YES, +nvshmemx_ptrdiff_iput_on_stream,YES, +nvshmemx_float_iput_block,YES, +nvshmemx_double_iput_block,YES, +nvshmemx_char_iput_block,YES, +nvshmemx_schar_iput_block,YES, +nvshmemx_short_iput_block,YES, +nvshmemx_int_iput_block,YES, +nvshmemx_long_iput_block,YES, +nvshmemx_longlong_iput_block,YES, +nvshmemx_uchar_iput_block,YES, +nvshmemx_ushort_iput_block,YES, +nvshmemx_uint_iput_block,YES, +nvshmemx_ulong_iput_block,YES, +nvshmemx_ulonglong_iput_block,YES, +nvshmemx_int8_iput_block,YES, +nvshmemx_int16_iput_block,YES, +nvshmemx_int32_iput_block,YES, +nvshmemx_int64_iput_block,YES, +nvshmemx_uint8_iput_block,YES, +nvshmemx_uint16_iput_block,YES, +nvshmemx_uint32_iput_block,YES, +nvshmemx_uint64_iput_block,YES, +nvshmemx_size_iput_block,YES, +nvshmemx_ptrdiff_iput_block,YES, +nvshmemx_float_iput_warp,YES, +nvshmemx_double_iput_warp,YES, +nvshmemx_char_iput_warp,YES, +nvshmemx_schar_iput_warp,YES, +nvshmemx_short_iput_warp,YES, +nvshmemx_int_iput_warp,YES, +nvshmemx_long_iput_warp,YES, +nvshmemx_longlong_iput_warp,YES, +nvshmemx_uchar_iput_warp,YES, +nvshmemx_ushort_iput_warp,YES, +nvshmemx_uint_iput_warp,YES, +nvshmemx_ulong_iput_warp,YES, +nvshmemx_ulonglong_iput_warp,YES, +nvshmemx_int8_iput_warp,YES, +nvshmemx_int16_iput_warp,YES, +nvshmemx_int32_iput_warp,YES, +nvshmemx_int64_iput_warp,YES, +nvshmemx_uint8_iput_warp,YES, +nvshmemx_uint16_iput_warp,YES, +nvshmemx_uint32_iput_warp,YES, +nvshmemx_uint64_iput_warp,YES, +nvshmemx_size_iput_warp,YES, +nvshmemx_ptrdiff_iput_warp,YES, +nvshmem_iput8,YES, +nvshmem_iput16,YES, +nvshmem_iput32,YES, +nvshmem_iput64,YES, +nvshmem_iput128,YES, +nvshmemx_iput8_on_stream,YES, +nvshmemx_iput16_on_stream,YES, +nvshmemx_iput32_on_stream,YES, +nvshmemx_iput64_on_stream,YES, +nvshmemx_iput128_on_stream,YES, +nvshmemx_iput8_block,YES, +nvshmemx_iput16_block,YES, +nvshmemx_iput32_block,YES, +nvshmemx_iput64_block,YES, +nvshmemx_iput128_block,YES, +nvshmemx_iput8_warp,YES, +nvshmemx_iput16_warp,YES, +nvshmemx_iput32_warp,YES, +nvshmemx_iput64_warp,YES, +nvshmemx_iput128_warp,YES, +nvshmem_float_get,YES, +nvshmem_double_get,YES, +nvshmem_char_get,YES, +nvshmem_schar_get,YES, +nvshmem_short_get,YES, +nvshmem_int_get,YES, +nvshmem_long_get,YES, +nvshmem_longlong_get,YES, +nvshmem_uchar_get,YES, +nvshmem_ushort_get,YES, +nvshmem_uint_get,YES, +nvshmem_ulong_get,YES, +nvshmem_ulonglong_get,YES, +nvshmem_int8_get,YES, +nvshmem_int16_get,YES, +nvshmem_int32_get,YES, +nvshmem_int64_get,YES, +nvshmem_uint8_get,YES, +nvshmem_uint16_get,YES, +nvshmem_uint32_get,YES, +nvshmem_uint64_get,YES, +nvshmem_size_get,YES, +nvshmem_ptrdiff_get,YES, +nvshmemx_float_get_on_stream,YES, +nvshmemx_double_get_on_stream,YES, +nvshmemx_char_get_on_stream,YES, +nvshmemx_schar_get_on_stream,YES, +nvshmemx_short_get_on_stream,YES, +nvshmemx_int_get_on_stream,YES, +nvshmemx_long_get_on_stream,YES, +nvshmemx_longlong_get_on_stream,YES, +nvshmemx_uchar_get_on_stream,YES, +nvshmemx_ushort_get_on_stream,YES, +nvshmemx_uint_get_on_stream,YES, +nvshmemx_ulong_get_on_stream,YES, +nvshmemx_ulonglong_get_on_stream,YES, +nvshmemx_int8_get_on_stream,YES, +nvshmemx_int16_get_on_stream,YES, +nvshmemx_int32_get_on_stream,YES, +nvshmemx_int64_get_on_stream,YES, +nvshmemx_uint8_get_on_stream,YES, +nvshmemx_uint16_get_on_stream,YES, +nvshmemx_uint32_get_on_stream,YES, +nvshmemx_uint64_get_on_stream,YES, +nvshmemx_size_get_on_stream,YES, +nvshmemx_ptrdiff_get_on_stream,YES, +nvshmemx_float_get_block,YES, +nvshmemx_double_get_block,YES, +nvshmemx_char_get_block,YES, +nvshmemx_schar_get_block,YES, +nvshmemx_short_get_block,YES, +nvshmemx_int_get_block,YES, +nvshmemx_long_get_block,YES, +nvshmemx_longlong_get_block,YES, +nvshmemx_uchar_get_block,YES, +nvshmemx_ushort_get_block,YES, +nvshmemx_uint_get_block,YES, +nvshmemx_ulong_get_block,YES, +nvshmemx_ulonglong_get_block,YES, +nvshmemx_int8_get_block,YES, +nvshmemx_int16_get_block,YES, +nvshmemx_int32_get_block,YES, +nvshmemx_int64_get_block,YES, +nvshmemx_uint8_get_block,YES, +nvshmemx_uint16_get_block,YES, +nvshmemx_uint32_get_block,YES, +nvshmemx_uint64_get_block,YES, +nvshmemx_size_get_block,YES, +nvshmemx_ptrdiff_get_block,YES, +nvshmemx_float_get_warp,YES, +nvshmemx_double_get_warp,YES, +nvshmemx_char_get_warp,YES, +nvshmemx_schar_get_warp,YES, +nvshmemx_short_get_warp,YES, +nvshmemx_int_get_warp,YES, +nvshmemx_long_get_warp,YES, +nvshmemx_longlong_get_warp,YES, +nvshmemx_uchar_get_warp,YES, +nvshmemx_ushort_get_warp,YES, +nvshmemx_uint_get_warp,YES, +nvshmemx_ulong_get_warp,YES, +nvshmemx_ulonglong_get_warp,YES, +nvshmemx_int8_get_warp,YES, +nvshmemx_int16_get_warp,YES, +nvshmemx_int32_get_warp,YES, +nvshmemx_int64_get_warp,YES, +nvshmemx_uint8_get_warp,YES, +nvshmemx_uint16_get_warp,YES, +nvshmemx_uint32_get_warp,YES, +nvshmemx_uint64_get_warp,YES, +nvshmemx_size_get_warp,YES, +nvshmemx_ptrdiff_get_warp,YES, +nvshmem_get8,YES, +nvshmem_get16,YES, +nvshmem_get32,YES, +nvshmem_get64,YES, +nvshmem_get128,YES, +nvshmemx_get8_on_stream,YES, +nvshmemx_get16_on_stream,YES, +nvshmemx_get32_on_stream,YES, +nvshmemx_get64_on_stream,YES, +nvshmemx_get128_on_stream,YES, +nvshmemx_get8_block,YES, +nvshmemx_get16_block,YES, +nvshmemx_get32_block,YES, +nvshmemx_get64_block,YES, +nvshmemx_get128_block,YES, +nvshmemx_get8_warp,YES, +nvshmemx_get16_warp,YES, +nvshmemx_get32_warp,YES, +nvshmemx_get64_warp,YES, +nvshmemx_get128_warp,YES, +nvshmem_getmem,YES, +nvshmemx_getmem_on_stream,YES, +nvshmemx_getmem_block,YES, +nvshmemx_getmem_warp,YES, +nvshmem_float_g,YES, +nvshmem_double_g,YES, +nvshmem_char_g,YES, +nvshmem_schar_g,YES, +nvshmem_short_g,YES, +nvshmem_int_g,YES, +nvshmem_long_g,YES, +nvshmem_longlong_g,YES, +nvshmem_uchar_g,YES, +nvshmem_ushort_g,YES, +nvshmem_uint_g,YES, +nvshmem_ulong_g,YES, +nvshmem_ulonglong_g,YES, +nvshmem_int8_g,YES, +nvshmem_int16_g,YES, +nvshmem_int32_g,YES, +nvshmem_int64_g,YES, +nvshmem_uint8_g,YES, +nvshmem_uint16_g,YES, +nvshmem_uint32_g,YES, +nvshmem_uint64_g,YES, +nvshmem_size_g,YES, +nvshmem_ptrdiff_g,YES, +nvshmem_float_iget,YES, +nvshmem_double_iget,YES, +nvshmem_char_iget,YES, +nvshmem_schar_iget,YES, +nvshmem_short_iget,YES, +nvshmem_int_iget,YES, +nvshmem_long_iget,YES, +nvshmem_longlong_iget,YES, +nvshmem_uchar_iget,YES, +nvshmem_ushort_iget,YES, +nvshmem_uint_iget,YES, +nvshmem_ulong_iget,YES, +nvshmem_ulonglong_iget,YES, +nvshmem_int8_iget,YES, +nvshmem_int16_iget,YES, +nvshmem_int32_iget,YES, +nvshmem_int64_iget,YES, +nvshmem_uint8_iget,YES, +nvshmem_uint16_iget,YES, +nvshmem_uint32_iget,YES, +nvshmem_uint64_iget,YES, +nvshmem_size_iget,YES, +nvshmem_ptrdiff_iget,YES, +nvshmemx_float_iget_on_stream,YES, +nvshmemx_double_iget_on_stream,YES, +nvshmemx_char_iget_on_stream,YES, +nvshmemx_schar_iget_on_stream,YES, +nvshmemx_short_iget_on_stream,YES, +nvshmemx_int_iget_on_stream,YES, +nvshmemx_long_iget_on_stream,YES, +nvshmemx_longlong_iget_on_stream,YES, +nvshmemx_uchar_iget_on_stream,YES, +nvshmemx_ushort_iget_on_stream,YES, +nvshmemx_uint_iget_on_stream,YES, +nvshmemx_ulong_iget_on_stream,YES, +nvshmemx_ulonglong_iget_on_stream,YES, +nvshmemx_int8_iget_on_stream,YES, +nvshmemx_int16_iget_on_stream,YES, +nvshmemx_int32_iget_on_stream,YES, +nvshmemx_int64_iget_on_stream,YES, +nvshmemx_uint8_iget_on_stream,YES, +nvshmemx_uint16_iget_on_stream,YES, +nvshmemx_uint32_iget_on_stream,YES, +nvshmemx_uint64_iget_on_stream,YES, +nvshmemx_size_iget_on_stream,YES, +nvshmemx_ptrdiff_iget_on_stream,YES, +nvshmemx_float_iget_block,YES, +nvshmemx_double_iget_block,YES, +nvshmemx_char_iget_block,YES, +nvshmemx_schar_iget_block,YES, +nvshmemx_short_iget_block,YES, +nvshmemx_int_iget_block,YES, +nvshmemx_long_iget_block,YES, +nvshmemx_longlong_iget_block,YES, +nvshmemx_uchar_iget_block,YES, +nvshmemx_ushort_iget_block,YES, +nvshmemx_uint_iget_block,YES, +nvshmemx_ulong_iget_block,YES, +nvshmemx_ulonglong_iget_block,YES, +nvshmemx_int8_iget_block,YES, +nvshmemx_int16_iget_block,YES, +nvshmemx_int32_iget_block,YES, +nvshmemx_int64_iget_block,YES, +nvshmemx_uint8_iget_block,YES, +nvshmemx_uint16_iget_block,YES, +nvshmemx_uint32_iget_block,YES, +nvshmemx_uint64_iget_block,YES, +nvshmemx_size_iget_block,YES, +nvshmemx_ptrdiff_iget_block,YES, +nvshmemx_float_iget_warp,YES, +nvshmemx_double_iget_warp,YES, +nvshmemx_char_iget_warp,YES, +nvshmemx_schar_iget_warp,YES, +nvshmemx_short_iget_warp,YES, +nvshmemx_int_iget_warp,YES, +nvshmemx_long_iget_warp,YES, +nvshmemx_longlong_iget_warp,YES, +nvshmemx_uchar_iget_warp,YES, +nvshmemx_ushort_iget_warp,YES, +nvshmemx_uint_iget_warp,YES, +nvshmemx_ulong_iget_warp,YES, +nvshmemx_ulonglong_iget_warp,YES, +nvshmemx_int8_iget_warp,YES, +nvshmemx_int16_iget_warp,YES, +nvshmemx_int32_iget_warp,YES, +nvshmemx_int64_iget_warp,YES, +nvshmemx_uint8_iget_warp,YES, +nvshmemx_uint16_iget_warp,YES, +nvshmemx_uint32_iget_warp,YES, +nvshmemx_uint64_iget_warp,YES, +nvshmemx_size_iget_warp,YES, +nvshmemx_ptrdiff_iget_warp,YES, +nvshmem_iget8,YES, +nvshmem_iget16,YES, +nvshmem_iget32,YES, +nvshmem_iget64,YES, +nvshmem_iget128,YES, +nvshmemx_iget8_on_stream,YES, +nvshmemx_iget16_on_stream,YES, +nvshmemx_iget32_on_stream,YES, +nvshmemx_iget64_on_stream,YES, +nvshmemx_iget128_on_stream,YES, +nvshmemx_iget8_block,YES, +nvshmemx_iget16_block,YES, +nvshmemx_iget32_block,YES, +nvshmemx_iget64_block,YES, +nvshmemx_iget128_block,YES, +nvshmemx_iget8_warp,YES, +nvshmemx_iget16_warp,YES, +nvshmemx_iget32_warp,YES, +nvshmemx_iget64_warp,YES, +nvshmemx_iget128_warp,YES, +nvshmem_float_put_nbi,YES, +nvshmem_double_put_nbi,YES, +nvshmem_char_put_nbi,YES, +nvshmem_schar_put_nbi,YES, +nvshmem_short_put_nbi,YES, +nvshmem_int_put_nbi,YES, +nvshmem_long_put_nbi,YES, +nvshmem_longlong_put_nbi,YES, +nvshmem_uchar_put_nbi,YES, +nvshmem_ushort_put_nbi,YES, +nvshmem_uint_put_nbi,YES, +nvshmem_ulong_put_nbi,YES, +nvshmem_ulonglong_put_nbi,YES, +nvshmem_int8_put_nbi,YES, +nvshmem_int16_put_nbi,YES, +nvshmem_int32_put_nbi,YES, +nvshmem_int64_put_nbi,YES, +nvshmem_uint8_put_nbi,YES, +nvshmem_uint16_put_nbi,YES, +nvshmem_uint32_put_nbi,YES, +nvshmem_uint64_put_nbi,YES, +nvshmem_size_put_nbi,YES, +nvshmem_ptrdiff_put_nbi,YES, +nvshmemx_float_put_nbi_on_stream,YES, +nvshmemx_double_put_nbi_on_stream,YES, +nvshmemx_char_put_nbi_on_stream,YES, +nvshmemx_schar_put_nbi_on_stream,YES, +nvshmemx_short_put_nbi_on_stream,YES, +nvshmemx_int_put_nbi_on_stream,YES, +nvshmemx_long_put_nbi_on_stream,YES, +nvshmemx_longlong_put_nbi_on_stream,YES, +nvshmemx_uchar_put_nbi_on_stream,YES, +nvshmemx_ushort_put_nbi_on_stream,YES, +nvshmemx_uint_put_nbi_on_stream,YES, +nvshmemx_ulong_put_nbi_on_stream,YES, +nvshmemx_ulonglong_put_nbi_on_stream,YES, +nvshmemx_int8_put_nbi_on_stream,YES, +nvshmemx_int16_put_nbi_on_stream,YES, +nvshmemx_int32_put_nbi_on_stream,YES, +nvshmemx_int64_put_nbi_on_stream,YES, +nvshmemx_uint8_put_nbi_on_stream,YES, +nvshmemx_uint16_put_nbi_on_stream,YES, +nvshmemx_uint32_put_nbi_on_stream,YES, +nvshmemx_uint64_put_nbi_on_stream,YES, +nvshmemx_size_put_nbi_on_stream,YES, +nvshmemx_ptrdiff_put_nbi_on_stream,YES, +nvshmemx_float_put_nbi_block,YES, +nvshmemx_double_put_nbi_block,YES, +nvshmemx_char_put_nbi_block,YES, +nvshmemx_schar_put_nbi_block,YES, +nvshmemx_short_put_nbi_block,YES, +nvshmemx_int_put_nbi_block,YES, +nvshmemx_long_put_nbi_block,YES, +nvshmemx_longlong_put_nbi_block,YES, +nvshmemx_uchar_put_nbi_block,YES, +nvshmemx_ushort_put_nbi_block,YES, +nvshmemx_uint_put_nbi_block,YES, +nvshmemx_ulong_put_nbi_block,YES, +nvshmemx_ulonglong_put_nbi_block,YES, +nvshmemx_int8_put_nbi_block,YES, +nvshmemx_int16_put_nbi_block,YES, +nvshmemx_int32_put_nbi_block,YES, +nvshmemx_int64_put_nbi_block,YES, +nvshmemx_uint8_put_nbi_block,YES, +nvshmemx_uint16_put_nbi_block,YES, +nvshmemx_uint32_put_nbi_block,YES, +nvshmemx_uint64_put_nbi_block,YES, +nvshmemx_size_put_nbi_block,YES, +nvshmemx_ptrdiff_put_nbi_block,YES, +nvshmemx_float_put_nbi_warp,YES, +nvshmemx_double_put_nbi_warp,YES, +nvshmemx_char_put_nbi_warp,YES, +nvshmemx_schar_put_nbi_warp,YES, +nvshmemx_short_put_nbi_warp,YES, +nvshmemx_int_put_nbi_warp,YES, +nvshmemx_long_put_nbi_warp,YES, +nvshmemx_longlong_put_nbi_warp,YES, +nvshmemx_uchar_put_nbi_warp,YES, +nvshmemx_ushort_put_nbi_warp,YES, +nvshmemx_uint_put_nbi_warp,YES, +nvshmemx_ulong_put_nbi_warp,YES, +nvshmemx_ulonglong_put_nbi_warp,YES, +nvshmemx_int8_put_nbi_warp,YES, +nvshmemx_int16_put_nbi_warp,YES, +nvshmemx_int32_put_nbi_warp,YES, +nvshmemx_int64_put_nbi_warp,YES, +nvshmemx_uint8_put_nbi_warp,YES, +nvshmemx_uint16_put_nbi_warp,YES, +nvshmemx_uint32_put_nbi_warp,YES, +nvshmemx_uint64_put_nbi_warp,YES, +nvshmemx_size_put_nbi_warp,YES, +nvshmemx_ptrdiff_put_nbi_warp,YES, +nvshmem_put8_nbi,YES, +nvshmem_put16_nbi,YES, +nvshmem_put32_nbi,YES, +nvshmem_put64_nbi,YES, +nvshmem_put128_nbi,YES, +nvshmemx_put8_nbi_on_stream,YES, +nvshmemx_put16_nbi_on_stream,YES, +nvshmemx_put32_nbi_on_stream,YES, +nvshmemx_put64_nbi_on_stream,YES, +nvshmemx_put128_nbi_on_stream,YES, +nvshmemx_put8_nbi_block,YES, +nvshmemx_put16_nbi_block,YES, +nvshmemx_put32_nbi_block,YES, +nvshmemx_put64_nbi_block,YES, +nvshmemx_put128_nbi_block,YES, +nvshmemx_put8_nbi_warp,YES, +nvshmemx_put16_nbi_warp,YES, +nvshmemx_put32_nbi_warp,YES, +nvshmemx_put64_nbi_warp,YES, +nvshmemx_put128_nbi_warp,YES, nvshmem_putmem_nbi,YES, -nvshmemx_putmem_nbi_on_stream,NO, -nvshmemx_putmem_nbi_block,NO, -nvshmemx_putmem_nbi_warp,NO, -nvshmem_float_get_nbi,NO, -nvshmem_double_get_nbi,NO, -nvshmem_char_get_nbi,NO, -nvshmem_schar_get_nbi,NO, -nvshmem_short_get_nbi,NO, -nvshmem_int_get_nbi,NO, -nvshmem_long_get_nbi,NO, -nvshmem_longlong_get_nbi,NO, -nvshmem_uchar_get_nbi,NO, -nvshmem_ushort_get_nbi,NO, -nvshmem_uint_get_nbi,NO, -nvshmem_ulong_get_nbi,NO, -nvshmem_ulonglong_get_nbi,NO, -nvshmem_int8_get_nbi,NO, -nvshmem_int16_get_nbi,NO, -nvshmem_int32_get_nbi,NO, -nvshmem_int64_get_nbi,NO, -nvshmem_uint8_get_nbi,NO, -nvshmem_uint16_get_nbi,NO, -nvshmem_uint32_get_nbi,NO, -nvshmem_uint64_get_nbi,NO, -nvshmem_size_get_nbi,NO, -nvshmem_ptrdiff_get_nbi,NO, -nvshmemx_float_get_nbi_on_stream,NO, -nvshmemx_double_get_nbi_on_stream,NO, -nvshmemx_char_get_nbi_on_stream,NO, -nvshmemx_schar_get_nbi_on_stream,NO, -nvshmemx_short_get_nbi_on_stream,NO, -nvshmemx_int_get_nbi_on_stream,NO, -nvshmemx_long_get_nbi_on_stream,NO, -nvshmemx_longlong_get_nbi_on_stream,NO, -nvshmemx_uchar_get_nbi_on_stream,NO, -nvshmemx_ushort_get_nbi_on_stream,NO, -nvshmemx_uint_get_nbi_on_stream,NO, -nvshmemx_ulong_get_nbi_on_stream,NO, -nvshmemx_ulonglong_get_nbi_on_stream,NO, -nvshmemx_int8_get_nbi_on_stream,NO, -nvshmemx_int16_get_nbi_on_stream,NO, -nvshmemx_int32_get_nbi_on_stream,NO, -nvshmemx_int64_get_nbi_on_stream,NO, -nvshmemx_uint8_get_nbi_on_stream,NO, -nvshmemx_uint16_get_nbi_on_stream,NO, -nvshmemx_uint32_get_nbi_on_stream,NO, -nvshmemx_uint64_get_nbi_on_stream,NO, -nvshmemx_size_get_nbi_on_stream,NO, -nvshmemx_ptrdiff_get_nbi_on_stream,NO, -nvshmemx_float_get_nbi_block,NO, -nvshmemx_double_get_nbi_block,NO, -nvshmemx_char_get_nbi_block,NO, -nvshmemx_schar_get_nbi_block,NO, -nvshmemx_short_get_nbi_block,NO, -nvshmemx_int_get_nbi_block,NO, -nvshmemx_long_get_nbi_block,NO, -nvshmemx_longlong_get_nbi_block,NO, -nvshmemx_uchar_get_nbi_block,NO, -nvshmemx_ushort_get_nbi_block,NO, -nvshmemx_uint_get_nbi_block,NO, -nvshmemx_ulong_get_nbi_block,NO, -nvshmemx_ulonglong_get_nbi_block,NO, -nvshmemx_int8_get_nbi_block,NO, -nvshmemx_int16_get_nbi_block,NO, -nvshmemx_int32_get_nbi_block,NO, -nvshmemx_int64_get_nbi_block,NO, -nvshmemx_uint8_get_nbi_block,NO, -nvshmemx_uint16_get_nbi_block,NO, -nvshmemx_uint32_get_nbi_block,NO, -nvshmemx_uint64_get_nbi_block,NO, -nvshmemx_size_get_nbi_block,NO, -nvshmemx_ptrdiff_get_nbi_block,NO, -nvshmemx_float_get_nbi_warp,NO, -nvshmemx_double_get_nbi_warp,NO, -nvshmemx_char_get_nbi_warp,NO, -nvshmemx_schar_get_nbi_warp,NO, -nvshmemx_short_get_nbi_warp,NO, -nvshmemx_int_get_nbi_warp,NO, -nvshmemx_long_get_nbi_warp,NO, -nvshmemx_longlong_get_nbi_warp,NO, -nvshmemx_uchar_get_nbi_warp,NO, -nvshmemx_ushort_get_nbi_warp,NO, -nvshmemx_uint_get_nbi_warp,NO, -nvshmemx_ulong_get_nbi_warp,NO, -nvshmemx_ulonglong_get_nbi_warp,NO, -nvshmemx_int8_get_nbi_warp,NO, -nvshmemx_int16_get_nbi_warp,NO, -nvshmemx_int32_get_nbi_warp,NO, -nvshmemx_int64_get_nbi_warp,NO, -nvshmemx_uint8_get_nbi_warp,NO, -nvshmemx_uint16_get_nbi_warp,NO, -nvshmemx_uint32_get_nbi_warp,NO, -nvshmemx_uint64_get_nbi_warp,NO, -nvshmemx_size_get_nbi_warp,NO, -nvshmemx_ptrdiff_get_nbi_warp,NO, -nvshmem_get8_nbi,NO, -nvshmem_get16_nbi,NO, -nvshmem_get32_nbi,NO, -nvshmem_get64_nbi,NO, -nvshmem_get128_nbi,NO, -nvshmemx_get8_nbi_on_stream,NO, -nvshmemx_get16_nbi_on_stream,NO, -nvshmemx_get32_nbi_on_stream,NO, -nvshmemx_get64_nbi_on_stream,NO, -nvshmemx_get128_nbi_on_stream,NO, -nvshmemx_get8_nbi_block,NO, -nvshmemx_get16_nbi_block,NO, -nvshmemx_get32_nbi_block,NO, -nvshmemx_get64_nbi_block,NO, -nvshmemx_get128_nbi_block,NO, -nvshmemx_get8_nbi_warp,NO, -nvshmemx_get16_nbi_warp,NO, -nvshmemx_get32_nbi_warp,NO, -nvshmemx_get64_nbi_warp,NO, -nvshmemx_get128_nbi_warp,NO, -nvshmem_getmem_nbi,NO, -nvshmemx_getmem_nbi_on_stream,NO, -nvshmemx_getmem_nbi_block,NO, -nvshmemx_getmem_nbi_warp,NO, +nvshmemx_putmem_nbi_on_stream,YES, +nvshmemx_putmem_nbi_block,YES, +nvshmemx_putmem_nbi_warp,YES, +nvshmem_float_get_nbi,YES, +nvshmem_double_get_nbi,YES, +nvshmem_char_get_nbi,YES, +nvshmem_schar_get_nbi,YES, +nvshmem_short_get_nbi,YES, +nvshmem_int_get_nbi,YES, +nvshmem_long_get_nbi,YES, +nvshmem_longlong_get_nbi,YES, +nvshmem_uchar_get_nbi,YES, +nvshmem_ushort_get_nbi,YES, +nvshmem_uint_get_nbi,YES, +nvshmem_ulong_get_nbi,YES, +nvshmem_ulonglong_get_nbi,YES, +nvshmem_int8_get_nbi,YES, +nvshmem_int16_get_nbi,YES, +nvshmem_int32_get_nbi,YES, +nvshmem_int64_get_nbi,YES, +nvshmem_uint8_get_nbi,YES, +nvshmem_uint16_get_nbi,YES, +nvshmem_uint32_get_nbi,YES, +nvshmem_uint64_get_nbi,YES, +nvshmem_size_get_nbi,YES, +nvshmem_ptrdiff_get_nbi,YES, +nvshmemx_float_get_nbi_on_stream,YES, +nvshmemx_double_get_nbi_on_stream,YES, +nvshmemx_char_get_nbi_on_stream,YES, +nvshmemx_schar_get_nbi_on_stream,YES, +nvshmemx_short_get_nbi_on_stream,YES, +nvshmemx_int_get_nbi_on_stream,YES, +nvshmemx_long_get_nbi_on_stream,YES, +nvshmemx_longlong_get_nbi_on_stream,YES, +nvshmemx_uchar_get_nbi_on_stream,YES, +nvshmemx_ushort_get_nbi_on_stream,YES, +nvshmemx_uint_get_nbi_on_stream,YES, +nvshmemx_ulong_get_nbi_on_stream,YES, +nvshmemx_ulonglong_get_nbi_on_stream,YES, +nvshmemx_int8_get_nbi_on_stream,YES, +nvshmemx_int16_get_nbi_on_stream,YES, +nvshmemx_int32_get_nbi_on_stream,YES, +nvshmemx_int64_get_nbi_on_stream,YES, +nvshmemx_uint8_get_nbi_on_stream,YES, +nvshmemx_uint16_get_nbi_on_stream,YES, +nvshmemx_uint32_get_nbi_on_stream,YES, +nvshmemx_uint64_get_nbi_on_stream,YES, +nvshmemx_size_get_nbi_on_stream,YES, +nvshmemx_ptrdiff_get_nbi_on_stream,YES, +nvshmemx_float_get_nbi_block,YES, +nvshmemx_double_get_nbi_block,YES, +nvshmemx_char_get_nbi_block,YES, +nvshmemx_schar_get_nbi_block,YES, +nvshmemx_short_get_nbi_block,YES, +nvshmemx_int_get_nbi_block,YES, +nvshmemx_long_get_nbi_block,YES, +nvshmemx_longlong_get_nbi_block,YES, +nvshmemx_uchar_get_nbi_block,YES, +nvshmemx_ushort_get_nbi_block,YES, +nvshmemx_uint_get_nbi_block,YES, +nvshmemx_ulong_get_nbi_block,YES, +nvshmemx_ulonglong_get_nbi_block,YES, +nvshmemx_int8_get_nbi_block,YES, +nvshmemx_int16_get_nbi_block,YES, +nvshmemx_int32_get_nbi_block,YES, +nvshmemx_int64_get_nbi_block,YES, +nvshmemx_uint8_get_nbi_block,YES, +nvshmemx_uint16_get_nbi_block,YES, +nvshmemx_uint32_get_nbi_block,YES, +nvshmemx_uint64_get_nbi_block,YES, +nvshmemx_size_get_nbi_block,YES, +nvshmemx_ptrdiff_get_nbi_block,YES, +nvshmemx_float_get_nbi_warp,YES, +nvshmemx_double_get_nbi_warp,YES, +nvshmemx_char_get_nbi_warp,YES, +nvshmemx_schar_get_nbi_warp,YES, +nvshmemx_short_get_nbi_warp,YES, +nvshmemx_int_get_nbi_warp,YES, +nvshmemx_long_get_nbi_warp,YES, +nvshmemx_longlong_get_nbi_warp,YES, +nvshmemx_uchar_get_nbi_warp,YES, +nvshmemx_ushort_get_nbi_warp,YES, +nvshmemx_uint_get_nbi_warp,YES, +nvshmemx_ulong_get_nbi_warp,YES, +nvshmemx_ulonglong_get_nbi_warp,YES, +nvshmemx_int8_get_nbi_warp,YES, +nvshmemx_int16_get_nbi_warp,YES, +nvshmemx_int32_get_nbi_warp,YES, +nvshmemx_int64_get_nbi_warp,YES, +nvshmemx_uint8_get_nbi_warp,YES, +nvshmemx_uint16_get_nbi_warp,YES, +nvshmemx_uint32_get_nbi_warp,YES, +nvshmemx_uint64_get_nbi_warp,YES, +nvshmemx_size_get_nbi_warp,YES, +nvshmemx_ptrdiff_get_nbi_warp,YES, +nvshmem_get8_nbi,YES, +nvshmem_get16_nbi,YES, +nvshmem_get32_nbi,YES, +nvshmem_get64_nbi,YES, +nvshmem_get128_nbi,YES, +nvshmemx_get8_nbi_on_stream,YES, +nvshmemx_get16_nbi_on_stream,YES, +nvshmemx_get32_nbi_on_stream,YES, +nvshmemx_get64_nbi_on_stream,YES, +nvshmemx_get128_nbi_on_stream,YES, +nvshmemx_get8_nbi_block,YES, +nvshmemx_get16_nbi_block,YES, +nvshmemx_get32_nbi_block,YES, +nvshmemx_get64_nbi_block,YES, +nvshmemx_get128_nbi_block,YES, +nvshmemx_get8_nbi_warp,YES, +nvshmemx_get16_nbi_warp,YES, +nvshmemx_get32_nbi_warp,YES, +nvshmemx_get64_nbi_warp,YES, +nvshmemx_get128_nbi_warp,YES, +nvshmem_getmem_nbi,YES, +nvshmemx_getmem_nbi_on_stream,YES, +nvshmemx_getmem_nbi_block,YES, +nvshmemx_getmem_nbi_warp,YES, nvshmem_float_atomic_fetch,NO, nvshmem_double_atomic_fetch,NO, nvshmem_int_atomic_fetch,NO, @@ -1085,7 +1085,7 @@ nvshmemx_putmem_signal_nbi_warp,NO, nvshmem_signal_fetch,NO, nvshmemx_signal_op,YES, nvshmem_barrier_all,NO, -nvshmemx_barrier_all_on_stream,NO, +nvshmemx_barrier_all_on_stream,YES, nvshmemx_barrier_all_block,NO, nvshmemx_barrier_all_warp,NO, nvshmem_barrier,NO, @@ -2117,6 +2117,6 @@ nvshmem_size_test_some_vector,NO, nvshmem_ptrdiff_test_some_vector,NO, nvshmemx_signal_wait_until_on_stream,NO, nvshmem_signal_wait_until,YES, -nvshmem_fence,NO, -nvshmem_quiet,NO, -nvshmemx_quiet_on_stream,NO, +nvshmem_fence,YES, +nvshmem_quiet,YES, +nvshmemx_quiet_on_stream,YES,