File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -17,7 +17,8 @@ createEmbeddingArpcService(int64_t model_r
1717 py::object py_tokenizer,
1818 std::shared_ptr<rtp_llm::MultimodalProcessor> mm_processor,
1919 std::shared_ptr<rtp_llm::EmbeddingEngine> engine,
20- kmonitor::MetricsReporterPtr reporter) {
20+ kmonitor::MetricsReporterPtr reporter,
21+ bool arpc_rdma_mode) {
2122 return nullptr ;
2223}
2324
Original file line number Diff line number Diff line change @@ -18,7 +18,8 @@ createEmbeddingArpcService(int64_t model_r
1818 py::object py_tokenizer,
1919 std::shared_ptr<rtp_llm::MultimodalProcessor> mm_processor,
2020 std::shared_ptr<rtp_llm::EmbeddingEngine> engine,
21- kmonitor::MetricsReporterPtr reporter);
21+ kmonitor::MetricsReporterPtr reporter,
22+ bool arpc_rdma_mode = false );
2223
2324// Factory: open-source stub throws for RDMA; internal_source provides real RDMA impl.
2425std::unique_ptr<ArpcServerWrapper> createArpcServerWrapper (bool arpc_rdma_mode,
Original file line number Diff line number Diff line change @@ -220,7 +220,8 @@ void RtpEmbeddingOp::startRpcServer(int64_t model_r
220220 py_tokenizer,
221221 mm_processor,
222222 embedding_engine_,
223- reporter));
223+ reporter,
224+ arpc_rdma_mode));
224225 if (arpc_service) {
225226 RTP_LLM_LOG_INFO (" creating arpc service" );
226227 embedding_rpc_service_ = createArpcServerWrapper (arpc_rdma_mode,
You can’t perform that action at this time.
0 commit comments