Skip to content

Commit 1d04d8e

Browse files
committed
UCT/CUDA/COPY: Revert qualify cuda_copy for RNDV with peer-failure EH
1 parent e91d676 commit 1d04d8e

2 files changed

Lines changed: 3 additions & 23 deletions

File tree

src/uct/cuda/cuda_copy/cuda_copy_iface.c

Lines changed: 1 addition & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -104,11 +104,7 @@ static ucs_status_t uct_cuda_copy_iface_query(uct_iface_h tl_iface,
104 104
iface_attr->iface_addr_len = sizeof(uct_cuda_copy_iface_addr_t);
105 105
iface_attr->device_addr_len = 0;
106 106
iface_attr->ep_addr_len = 0;
107-
/* UCT_IFACE_FLAG_ERRHANDLE_PEER_FAILURE required for RMA BW wireup
108-
* (ucp_wireup_fill_peer_err_criteria) when error handling is requested.
109-
* Transfers are local copies; UCP handles invalidation when a peer fails. */
110-
iface_attr->cap.flags = UCT_IFACE_FLAG_ERRHANDLE_PEER_FAILURE |
111-
UCT_IFACE_FLAG_CONNECT_TO_IFACE |
107+
iface_attr->cap.flags = UCT_IFACE_FLAG_CONNECT_TO_IFACE |
112 108
UCT_IFACE_FLAG_GET_SHORT |
113 109
UCT_IFACE_FLAG_PUT_SHORT |
114 110
UCT_IFACE_FLAG_GET_ZCOPY |

src/uct/cuda/cuda_copy/cuda_copy_md.c

Lines changed: 2 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,6 @@
20 20
#include <ucs/sys/ptr_arith.h>
21 21
#include <uct/cuda/base/cuda_ctx.inl>
22 22
#include <uct/api/v2/uct_v2.h>
23-
#include <uct/base/uct_iface.h>
24 23
#include <cuda.h>
25 24
#if CUDA_VERSION >= 11070
26 25
#include <cudaTypedefs.h>
@@ -119,14 +118,7 @@ uct_cuda_copy_md_query(uct_md_h uct_md, uct_md_attr_v2_t *md_attr)
119 118
uct_cuda_copy_md_t *md = ucs_derived_of(uct_md, uct_cuda_copy_md_t);
120 119

121 120
uct_md_base_md_query(md_attr);
122-
/* Advertise RMA invalidation so RMA BW lanes qualify for UCP wireup when
123-
* UCP_EP_INIT_ERR_MODE_PEER_FAILURE is set with RNDV (see
124-
* ucp_wireup_add_rma_bw_lanes). cuda_copy has no remote RMA keys; local
125-
* registration teardown is synchronous and satisfies the invalidate
126-
* contract via uct_cuda_copy_mem_dereg(). */
127-
md_attr->flags = UCT_MD_FLAG_REG | UCT_MD_FLAG_ALLOC |
128-
UCT_MD_FLAG_INVALIDATE |
129-
UCT_MD_FLAG_INVALIDATE_RMA;
121+
md_attr->flags = UCT_MD_FLAG_REG | UCT_MD_FLAG_ALLOC;
130 122
md_attr->reg_mem_types = UCS_BIT(UCS_MEMORY_TYPE_HOST) |
131 123
UCS_BIT(UCS_MEMORY_TYPE_CUDA) |
132 124
UCS_BIT(UCS_MEMORY_TYPE_CUDA_MANAGED);
@@ -188,21 +180,13 @@ UCS_PROFILE_FUNC(ucs_status_t, uct_cuda_copy_mem_dereg,
188 180
(md, params),
189 181
uct_md_h md, const uct_md_mem_dereg_params_t *params)
190 182
{
191-
unsigned flags;
192-
193-
UCT_MD_MEM_DEREG_CHECK_PARAMS(params, 1);
183+
UCT_MD_MEM_DEREG_CHECK_PARAMS(params, 0);
194 184

195 185
if (params->memh != &uct_cuda_dummy_memh) {
196 186
UCT_CUDADRV_FUNC(cuMemHostUnregister((void*)params->memh),
197 187
UCS_LOG_LEVEL_DIAG);
198 188
}
199 189

200-
flags = UCT_MD_MEM_DEREG_FIELD_VALUE(params, flags, FIELD_FLAGS, 0);
201-
if (flags & UCT_MD_MEM_DEREG_FLAG_INVALIDATE) {
202-
ucs_assert(params->comp != NULL); /* suppress coverity false-positive */
203-
uct_invoke_completion(params->comp, UCS_OK);
204-
}
205-
206 190
return UCS_OK;
207 191
}
208 192

0 commit comments

Comments
 (0)