@@ -170,10 +170,10 @@ int32_t TcpEndpoint::register_remote_memory_region(const std::string& name, cons
170170 return remote_pool_->register_remote_memory_region (mr_info, name);
171171}
172172
173- // ── async_send ──────────────────────────────────────────
173+ // ── send ──────────────────────────────────────────
174174// chunk_tuple_t = (src_ptr, offset, length) — raw pointers, no MR lookup.
175175
176- std::shared_ptr<TcpSendFuture> TcpEndpoint::async_send (const chunk_tuple_t & chunk, int64_t /* timeout_ms*/ )
176+ std::shared_ptr<TcpSendFuture> TcpEndpoint::send (const chunk_tuple_t & chunk, int64_t /* timeout_ms*/ )
177177{
178178 uintptr_t src = std::get<0 >(chunk) + std::get<1 >(chunk);
179179 size_t len = std::get<2 >(chunk);
@@ -198,7 +198,7 @@ std::shared_ptr<TcpSendFuture> TcpEndpoint::async_send(const chunk_tuple_t& chun
198198 auto * buf = new char [len];
199199 auto cu_err = cudaMemcpy (buf, send_ptr, len, cudaMemcpyDeviceToHost);
200200 if (cu_err != cudaSuccess) {
201- SLIME_LOG_ERROR (" async_send cudaMemcpy D2H: " , cudaGetErrorString (cu_err));
201+ SLIME_LOG_ERROR (" send cudaMemcpy D2H: " , cudaGetErrorString (cu_err));
202202 delete[] buf;
203203 op->completion_status .store (TCP_FAILED, std::memory_order_release);
204204 op->signal ->force_complete ();
@@ -213,7 +213,7 @@ std::shared_ptr<TcpSendFuture> TcpEndpoint::async_send(const chunk_tuple_t& chun
213213 auto session = std::make_shared<ClientSession>(
214214 std::move (conn->socket ), [op, conn, &pool, send_ptr, is_cuda](asio::error_code ec) {
215215 if (ec)
216- SLIME_LOG_WARN (" async_send : " , ec.message ());
216+ SLIME_LOG_WARN (" send : " , ec.message ());
217217 op->completion_status .store (ec ? TCP_FAILED : TCP_SUCCESS, std::memory_order_release);
218218 if (op->signal )
219219 op->signal ->set_comm_done (0 );
@@ -228,10 +228,10 @@ std::shared_ptr<TcpSendFuture> TcpEndpoint::async_send(const chunk_tuple_t& chun
228228 return std::make_shared<TcpSendFuture>(op);
229229}
230230
231- // ── async_recv ──────────────────────────────────────────
231+ // ── recv ──────────────────────────────────────────
232232// chunk_tuple_t = (dst_ptr, offset, length) — raw pointers, no MR lookup.
233233
234- std::shared_ptr<TcpRecvFuture> TcpEndpoint::async_recv (const chunk_tuple_t & chunk, bool exact_size)
234+ std::shared_ptr<TcpRecvFuture> TcpEndpoint::recv (const chunk_tuple_t & chunk, bool exact_size)
235235{
236236 auto op = TcpOpState::create ();
237237 op->signal ->reset_all ();
@@ -258,15 +258,14 @@ std::shared_ptr<TcpRecvFuture> TcpEndpoint::async_recv(const chunk_tuple_t& chun
258258 return std::make_shared<TcpRecvFuture>(op);
259259}
260260
261- // ── async_read ──────────────────────────────────────────
261+ // ── read ──────────────────────────────────────────
262262// Each assign creates an independent ClientSession; all share one OpState.
263263// Future.wait() blocks until every session has signalled its bit.
264264
265- std::shared_ptr<TcpReadWriteFuture> TcpEndpoint::async_read (const std::vector<assign_tuple_t >& assign,
266- int64_t /* timeout_ms*/ )
265+ std::shared_ptr<TcpReadWriteFuture> TcpEndpoint::read (const std::vector<assign_tuple_t >& assign, int64_t /* timeout_ms*/ )
267266{
268267 if (assign.empty ())
269- throw std::runtime_error (" TcpEndpoint::async_read : empty assignment" );
268+ throw std::runtime_error (" TcpEndpoint::read : empty assignment" );
270269
271270 size_t N = assign.size ();
272271 auto op = TcpOpState::create ();
@@ -288,7 +287,7 @@ std::shared_ptr<TcpReadWriteFuture> TcpEndpoint::async_read(const std::vector<as
288287 auto local = local_pool_->get_mr_fast (local_h);
289288 auto remote = remote_pool_->get_remote_mr_fast (remote_h);
290289 if (local.length == 0 || remote.length == 0 )
291- throw std::runtime_error (" TcpEndpoint::async_read : invalid MR handle" );
290+ throw std::runtime_error (" TcpEndpoint::read : invalid MR handle" );
292291
293292 uintptr_t local_dst = local.addr + local_off;
294293 SessionHeader hdr{length, remote.addr + remote_off, OP_READ};
@@ -313,14 +312,14 @@ std::shared_ptr<TcpReadWriteFuture> TcpEndpoint::async_read(const std::vector<as
313312 std::move (conn->socket ),
314313 [op, conn, i, &pool, read_dst, is_cuda, real_dst = local_dst, len = length](asio::error_code ec) {
315314 if (ec) {
316- SLIME_LOG_WARN (" async_read session " , i, " : " , ec.message ());
315+ SLIME_LOG_WARN (" read session " , i, " : " , ec.message ());
317316 op->completion_status .store (TCP_FAILED, std::memory_order_release);
318317 }
319318#ifdef USE_CUDA
320319 if (!ec && is_cuda) {
321320 auto cu_err = cudaMemcpy (reinterpret_cast <void *>(real_dst), read_dst, len, cudaMemcpyHostToDevice);
322321 if (cu_err != cudaSuccess) {
323- SLIME_LOG_ERROR (" async_read cudaMemcpy H2D: " , cudaGetErrorString (cu_err));
322+ SLIME_LOG_ERROR (" read cudaMemcpy H2D: " , cudaGetErrorString (cu_err));
324323 op->completion_status .store (TCP_FAILED, std::memory_order_release);
325324 }
326325 }
@@ -337,14 +336,14 @@ std::shared_ptr<TcpReadWriteFuture> TcpEndpoint::async_read(const std::vector<as
337336 return std::make_shared<TcpReadWriteFuture>(op);
338337}
339338
340- // ── async_write ─────────────────────────────────────────
339+ // ── write ─────────────────────────────────────────
341340// Each assign creates an independent ClientSession; all share one OpState.
342341
343- std::shared_ptr<TcpReadWriteFuture> TcpEndpoint::async_write (const std::vector<assign_tuple_t >& assign,
344- int64_t /* timeout_ms*/ )
342+ std::shared_ptr<TcpReadWriteFuture> TcpEndpoint::write (const std::vector<assign_tuple_t >& assign,
343+ int64_t /* timeout_ms*/ )
345344{
346345 if (assign.empty ())
347- throw std::runtime_error (" TcpEndpoint::async_write : empty assignment" );
346+ throw std::runtime_error (" TcpEndpoint::write : empty assignment" );
348347
349348 size_t N = assign.size ();
350349 auto op = TcpOpState::create ();
@@ -366,7 +365,7 @@ std::shared_ptr<TcpReadWriteFuture> TcpEndpoint::async_write(const std::vector<a
366365 auto local = local_pool_->get_mr_fast (local_h);
367366 auto remote = remote_pool_->get_remote_mr_fast (remote_h);
368367 if (local.length == 0 || remote.length == 0 )
369- throw std::runtime_error (" TcpEndpoint::async_write : invalid MR handle" );
368+ throw std::runtime_error (" TcpEndpoint::write : invalid MR handle" );
370369
371370 uintptr_t src = local.addr + local_off;
372371 SessionHeader hdr{length, remote.addr + remote_off, OP_WRITE};
@@ -385,7 +384,7 @@ std::shared_ptr<TcpReadWriteFuture> TcpEndpoint::async_write(const std::vector<a
385384 auto * buf = new char [length];
386385 auto cu_err = cudaMemcpy (buf, send_ptr, length, cudaMemcpyDeviceToHost);
387386 if (cu_err != cudaSuccess) {
388- SLIME_LOG_ERROR (" async_write cudaMemcpy D2H: " , cudaGetErrorString (cu_err));
387+ SLIME_LOG_ERROR (" write cudaMemcpy D2H: " , cudaGetErrorString (cu_err));
389388 delete[] buf;
390389 op->completion_status .store (TCP_FAILED, std::memory_order_release);
391390 op->signal ->force_complete ();
@@ -400,7 +399,7 @@ std::shared_ptr<TcpReadWriteFuture> TcpEndpoint::async_write(const std::vector<a
400399 auto session = std::make_shared<ClientSession>(
401400 std::move (conn->socket ), [op, conn, i, &pool, send_ptr, is_cuda](asio::error_code ec) {
402401 if (ec) {
403- SLIME_LOG_WARN (" async_write session " , i, " : " , ec.message ());
402+ SLIME_LOG_WARN (" write session " , i, " : " , ec.message ());
404403 op->completion_status .store (TCP_FAILED, std::memory_order_release);
405404 }
406405 if (op->signal )
0 commit comments