Skip to content

Commit e05e4e5

Browse files
committed
feat: support rawstring
1 parent 08f5440 commit e05e4e5

3 files changed

Lines changed: 6 additions & 3 deletions

File tree

rtp_llm/cpp/embedding_engine/arpc/ArpcServiceCreator.cc

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,8 @@ createEmbeddingArpcService(int64_t model_r
1717
py::object py_tokenizer,
1818
std::shared_ptr<rtp_llm::MultimodalProcessor> mm_processor,
1919
std::shared_ptr<rtp_llm::EmbeddingEngine> engine,
20-
kmonitor::MetricsReporterPtr reporter) {
20+
kmonitor::MetricsReporterPtr reporter,
21+
bool arpc_rdma_mode) {
2122
return nullptr;
2223
}
2324

rtp_llm/cpp/embedding_engine/arpc/ArpcServiceCreator.h

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,8 @@ createEmbeddingArpcService(int64_t model_r
1818
py::object py_tokenizer,
1919
std::shared_ptr<rtp_llm::MultimodalProcessor> mm_processor,
2020
std::shared_ptr<rtp_llm::EmbeddingEngine> engine,
21-
kmonitor::MetricsReporterPtr reporter);
21+
kmonitor::MetricsReporterPtr reporter,
22+
bool arpc_rdma_mode = false);
2223

2324
// Factory: open-source stub throws for RDMA; internal_source provides real RDMA impl.
2425
std::unique_ptr<ArpcServerWrapper> createArpcServerWrapper(bool arpc_rdma_mode,

rtp_llm/cpp/pybind/multi_gpu_gpt/RtpEmbeddingOp.cc

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -220,7 +220,8 @@ void RtpEmbeddingOp::startRpcServer(int64_t model_r
220220
py_tokenizer,
221221
mm_processor,
222222
embedding_engine_,
223-
reporter));
223+
reporter,
224+
arpc_rdma_mode));
224225
if (arpc_service) {
225226
RTP_LLM_LOG_INFO("creating arpc service");
226227
embedding_rpc_service_ = createArpcServerWrapper(arpc_rdma_mode,

0 commit comments

Comments
 (0)