zilliztech
diff --git a/include/knowhere/config.h b/include/knowhere/config.h
Lines changed: 1 addition & 1 deletion
diff --git a/include/knowhere/emb_list_utils.h b/include/knowhere/emb_list_utils.h
Lines changed: 14 additions & 13 deletions
diff --git a/src/index/diskann/diskann.cc b/src/index/diskann/diskann.cc
Lines changed: 22 additions & 2 deletions
diff --git a/src/index/index_node.cc b/src/index/index_node.cc
Lines changed: 58 additions & 31 deletions
diff --git a/src/index/index_static.cc b/src/index/index_static.cc
Lines changed: 8 additions & 0 deletions
@@ -849,7 +849,7 @@ class BaseConfig : public Config {
         KNOWHERE_CONFIG_DECLARE_FIELD(lemur_hidden_dim)
             .description("Hidden dimension for LEMUR MLP (compressed representation dimension)")
             .set_default(256)
-            .set_range(32, 4096)
+            .set_range(8, 8192)
             .for_train();
         KNOWHERE_CONFIG_DECLARE_FIELD(lemur_num_train_samples)
             .description("Number of training samples for LEMUR MLP")
 
@@ -21,6 +21,7 @@
 #include "knowhere/bitsetview.h"
 #include "knowhere/log.h"
 #include "knowhere/object.h"
+#include "knowhere/utils.h"
 
 namespace knowhere {
 
@@ -199,7 +200,7 @@ using EmbListAggFunc = std::function<std::optional<float>(const float*, size_t,
 
 inline std::optional<EmbListAggFunc>
 get_emb_list_agg_func(const std::string& el_metric_type) {
-    if (el_metric_type == metric::MAX_SIM) {
+    if (IsMetricType(el_metric_type, metric::MAX_SIM)) {  // MAX_SIM is the only aggregation resolved to a function here
         return get_sum_max_sim;
     }
-    return nullptr;
+    return std::nullopt;  // was nullptr: that yields an engaged optional wrapping an empty std::function, so has_value() was true
@@ -212,13 +213,13 @@ get_emb_list_agg_func(const std::string& el_metric_type) {
  */
 inline std::optional<std::string>
 get_el_metric_type(const std::string& metric_type) {
-    if (metric_type == metric::MAX_SIM || metric_type == metric::MAX_SIM_IP || metric_type == metric::MAX_SIM_L2 ||
-        metric_type == metric::MAX_SIM_COSINE || metric_type == metric::MAX_SIM_HAMMING ||
-        metric_type == metric::MAX_SIM_JACCARD) {
+    if (IsMetricType(metric_type, metric::MAX_SIM) || IsMetricType(metric_type, metric::MAX_SIM_IP) ||  // NOTE(review): IsMetricType replaces exact ==; presumably case-insensitive — confirm in knowhere/utils.h
+        IsMetricType(metric_type, metric::MAX_SIM_L2) || IsMetricType(metric_type, metric::MAX_SIM_COSINE) ||
+        IsMetricType(metric_type, metric::MAX_SIM_HAMMING) || IsMetricType(metric_type, metric::MAX_SIM_JACCARD)) {  // every MAX_SIM* name maps to the MAX_SIM list metric
         return metric::MAX_SIM;
-    } else if (metric_type == metric::DTW || metric_type == metric::DTW_IP || metric_type == metric::DTW_L2 ||
-               metric_type == metric::DTW_COSINE || metric_type == metric::DTW_HAMMING ||
-               metric_type == metric::DTW_JACCARD) {
+    } else if (IsMetricType(metric_type, metric::DTW) || IsMetricType(metric_type, metric::DTW_IP) ||
+               IsMetricType(metric_type, metric::DTW_L2) || IsMetricType(metric_type, metric::DTW_COSINE) ||
+               IsMetricType(metric_type, metric::DTW_HAMMING) || IsMetricType(metric_type, metric::DTW_JACCARD)) {  // every DTW* name maps to the DTW list metric
         return metric::DTW;
     }
     return std::nullopt;
@@ -231,20 +232,20 @@ get_el_metric_type(const std::string& metric_type) {
  */
 inline std::optional<std::string>
 get_sub_metric_type(const std::string& metric_type) {
-    if (metric_type == metric::MAX_SIM_COSINE || metric_type == metric::MAX_SIM || metric_type == metric::DTW_COSINE ||
-        metric_type == metric::DTW) {
+    if (IsMetricType(metric_type, metric::MAX_SIM_COSINE) || IsMetricType(metric_type, metric::MAX_SIM) ||
+        IsMetricType(metric_type, metric::DTW_COSINE) || IsMetricType(metric_type, metric::DTW)) {  // bare MAX_SIM / DTW resolve to COSINE, same as the explicit *_COSINE names
         return metric::COSINE;
     }
-    if (metric_type == metric::MAX_SIM_IP || metric_type == metric::DTW_IP) {
+    if (IsMetricType(metric_type, metric::MAX_SIM_IP) || IsMetricType(metric_type, metric::DTW_IP)) {  // *_IP -> IP
         return metric::IP;
     }
-    if (metric_type == metric::MAX_SIM_L2 || metric_type == metric::DTW_L2) {
+    if (IsMetricType(metric_type, metric::MAX_SIM_L2) || IsMetricType(metric_type, metric::DTW_L2)) {  // *_L2 -> L2
         return metric::L2;
     }
-    if (metric_type == metric::MAX_SIM_HAMMING || metric_type == metric::DTW_HAMMING) {
+    if (IsMetricType(metric_type, metric::MAX_SIM_HAMMING) || IsMetricType(metric_type, metric::DTW_HAMMING)) {  // *_HAMMING -> HAMMING
         return metric::HAMMING;
     }
-    if (metric_type == metric::MAX_SIM_JACCARD || metric_type == metric::DTW_JACCARD) {
+    if (IsMetricType(metric_type, metric::MAX_SIM_JACCARD) || IsMetricType(metric_type, metric::DTW_JACCARD)) {  // *_JACCARD -> JACCARD
         return metric::JACCARD;
     }
     return std::nullopt;
 
@@ -104,12 +104,25 @@ class DiskANNIndexNode : public IndexNode {
     static bool
     StaticHasRawData(const knowhere::BaseConfig& config, const IndexVersion& version) {
         knowhere::MetricType metric_type = config.metric_type.has_value() ? config.metric_type.value() : "";
-        return IsMetricType(metric_type, metric::L2) || IsMetricType(metric_type, metric::COSINE);
+        const auto& base_metric = get_sub_metric_type(metric_type).value_or(metric_type);  // use the sub-metric when get_sub_metric_type yields one, otherwise metric_type itself; value_or returns by value, the const ref extends its lifetime
+        return IsMetricType(base_metric, metric::L2) || IsMetricType(base_metric, metric::COSINE);  // true only when the resolved metric is L2 or COSINE
+    }
+
+    static Status
+    StaticConfigCheck(const Config& cfg, PARAM_TYPE paramType, std::string& msg) {  // paramType is not consulted; msg is written only on rejection
+        auto& base_cfg = static_cast<const BaseConfig&>(cfg);  // NOTE(review): unchecked downcast — assumes cfg is always a BaseConfig (or derived); confirm at call sites
+        auto strategy = base_cfg.emb_list_strategy.value_or("");  // an unset strategy becomes "", which passes the check below
+        if (strategy == meta::EMB_LIST_STRATEGY_MUVERA || strategy == meta::EMB_LIST_STRATEGY_LEMUR) {  // only these two values are rejected; any other string is accepted here
+            msg = "DiskANN only supports TokenANN strategy, got '" + strategy + "'";
+            return Status::invalid_args;
+        }
+        return Status::success;
     }
 
     bool
     HasRawData(const std::string& metric_type) const override {
-        return IsMetricType(metric_type, metric::L2) || IsMetricType(metric_type, metric::COSINE);
+        const auto& base_metric = get_sub_metric_type(metric_type).value_or(metric_type);  // use the sub-metric when get_sub_metric_type yields one, otherwise metric_type itself
+        return IsMetricType(base_metric, metric::L2) || IsMetricType(base_metric, metric::COSINE);  // true only when the resolved metric is L2 or COSINE
     }
 
     expected<DataSetPtr>
@@ -497,6 +510,13 @@ DiskANNIndexNode<DataType>::BuildEmbListIfNeed(const DataSetPtr dataset, std::sh
         return Build(dataset, std::move(cfg), use_knowhere_build_pool);
     }
 
+    // DiskANN only supports TokenANN strategy
+    auto strategy_type = config.emb_list_strategy.value_or(meta::EMB_LIST_STRATEGY_TOKENANN);
+    if (strategy_type != meta::EMB_LIST_STRATEGY_TOKENANN) {
+        LOG_KNOWHERE_ERROR_ << "DiskANN only supports TokenANN strategy, got: " << strategy_type;
+        return Status::invalid_args;
+    }
+
     LOG_KNOWHERE_INFO_ << "Build emb_list index and read emb_list offset from file.";
 
     // Validate and get the emb_list offset file path
 
@@ -287,25 +287,24 @@ IndexNode::GetEmbListByIds(const DataSetPtr dataset, const std::string& metric_t
                                          "GetEmbListByIds requires emb_list_offset, but it is not available");
     }
     auto sub_metric = get_sub_metric_type(metric_type);
-    if (!sub_metric.has_value() || !HasRawData(sub_metric.value())) {
+    if (!sub_metric.has_value()) {
+        return expected<DataSetPtr>::Err(Status::not_implemented,
+                                         "GetEmbListByIds: invalid metric type " + metric_type);
+    }
+
+    // Raw data can come from emb_list_raw_index_ (MUVERA/LEMUR) or base index (TokenANN)
+    bool use_raw_index = (emb_list_raw_index_ != nullptr);
+    if (!use_raw_index && !HasRawData(sub_metric.value())) {
         return expected<DataSetPtr>::Err(
             Status::not_implemented,
             "GetEmbListByIds requires raw data support, but the index does not store raw vectors");
     }
 
     auto num_el_ids = dataset->GetRows();
     auto el_ids = dataset->GetIds();
-    auto dim = Dim();
-
-    // Build the output offset array and collect all vector-level IDs in a single pass.
-    //
-    // TODO(perf): Vectors within each embedding list are contiguous in the index. However, the current
-    // implementation collects all these contiguous IDs into a flat array and passes them to GetVectorByIds,
-    // which internally calls reconstruct(id, ...) one vector at a time. This could be optimized by using
-    // reconstruct_n(start, len, ...) or direct memcpy from raw data storage, avoiding both the redundant
-    // ID array allocation and per-vector overhead. We don't do this yet because it would require
-    // index-type-specific implementations (HNSW, IVF, FLAT, etc. each store raw data differently),
-    // whereas the current approach works generically across all index types via the GetVectorByIds interface.
+    auto dim = use_raw_index ? emb_list_raw_index_->d : Dim();
+
+    // Build the output offset array
     std::vector<size_t> out_offsets(num_el_ids + 1);
     out_offsets[0] = 0;
     for (int64_t i = 0; i < num_el_ids; i++) {
@@ -318,17 +317,9 @@ IndexNode::GetEmbListByIds(const DataSetPtr dataset, const std::string& metric_t
         out_offsets[i + 1] = out_offsets[i] + emb_list_offset_->get_el_len(el_id);
     }
 
-    std::vector<int64_t> vec_ids;
-    vec_ids.reserve(out_offsets[num_el_ids]);
-    for (int64_t i = 0; i < num_el_ids; i++) {
-        size_t start = emb_list_offset_->offset[el_ids[i]];
-        size_t len = out_offsets[i + 1] - out_offsets[i];
-        for (size_t j = 0; j < len; j++) {
-            vec_ids.push_back(static_cast<int64_t>(start + j));
-        }
-    }
+    auto total_vecs = out_offsets[num_el_ids];
 
-    if (vec_ids.empty()) {
+    if (total_vecs == 0) {
         // all emblist are empty list
         auto result = GenResultDataSet(num_el_ids, dim, (const void*)nullptr);
         auto* offsets_ptr = new size_t[out_offsets.size()];
@@ -337,16 +328,52 @@ IndexNode::GetEmbListByIds(const DataSetPtr dataset, const std::string& metric_t
         return result;
     }
 
-    auto vec_dataset = GenIdsDataSet(vec_ids.size(), vec_ids.data());
-    auto res = GetVectorByIds(vec_dataset, op_context);
-    if (!res.has_value()) {
-        return res;
-    }
+    const void* tensor = nullptr;
+
+    if (use_raw_index) {
+        // MUVERA/LEMUR: vectors are contiguous per el in emb_list_raw_index_, use reconstruct_n
+        auto data = std::make_unique<float[]>(total_vecs * dim);
+        float* ptr = data.get();
+        for (int64_t i = 0; i < num_el_ids; i++) {
+            auto start = static_cast<int64_t>(emb_list_offset_->offset[el_ids[i]]);
+            auto len = static_cast<int64_t>(out_offsets[i + 1] - out_offsets[i]);
+            if (len > 0) {
+                emb_list_raw_index_->reconstruct_n(start, len, ptr);
+                ptr += len * dim;
+            }
+        }
+        tensor = data.release();
+    } else {
+        // TokenANN: collect vec_ids and use base index GetVectorByIds
+        //
+        // TODO(perf): Vectors within each embedding list are contiguous in the index. However, the current
+        // implementation collects all these contiguous IDs into a flat array and passes them to GetVectorByIds,
+        // which internally calls reconstruct(id, ...) one vector at a time. This could be optimized by using
+        // reconstruct_n(start, len, ...) or direct memcpy from raw data storage, avoiding both the redundant
+        // ID array allocation and per-vector overhead. We don't do this yet because it would require
+        // index-type-specific implementations (HNSW, IVF, FLAT, etc. each store raw data differently),
+        // whereas the current approach works generically across all index types via the GetVectorByIds interface.
+        std::vector<int64_t> vec_ids;
+        vec_ids.reserve(total_vecs);
+        for (int64_t i = 0; i < num_el_ids; i++) {
+            size_t start = emb_list_offset_->offset[el_ids[i]];
+            size_t len = out_offsets[i + 1] - out_offsets[i];
+            for (size_t j = 0; j < len; j++) {
+                vec_ids.push_back(static_cast<int64_t>(start + j));
+            }
+        }
+
+        // Build result: transfer tensor ownership from GetVectorByIds result to new dataset
+        auto vec_dataset = GenIdsDataSet(vec_ids.size(), vec_ids.data());
+        auto res = GetVectorByIds(vec_dataset, op_context);
+        if (!res.has_value()) {
+            return res;
+        }
 
-    // Build result: transfer tensor ownership from GetVectorByIds result to new dataset
-    auto vec_result = res.value();
-    auto tensor = vec_result->GetTensor();
-    vec_result->SetIsOwner(false);
+        auto vec_result = res.value();
+        tensor = vec_result->GetTensor();
+        vec_result->SetIsOwner(false);
+    }
 
     auto result = GenResultDataSet(num_el_ids, dim, tensor);
     auto* offsets_ptr = new size_t[out_offsets.size()];
 
@@ -56,6 +56,14 @@ IndexStaticFaced<DataType>::ConfigCheck(const IndexType& indexType, const IndexV
         return status;
     }
 
+    if constexpr (!std::is_same_v<DataType, knowhere::fp32>) {
+        auto strategy = cfg->emb_list_strategy.value_or("");
+        if (strategy == meta::EMB_LIST_STRATEGY_MUVERA || strategy == meta::EMB_LIST_STRATEGY_LEMUR) {
+            msg = "MUVERA/LEMUR strategies only support fp32 data type, got '" + strategy + "'";
+            return Status::invalid_args;
+        }
+    }
+
     if (Instance().staticConfigCheckMap.find(indexType) != Instance().staticConfigCheckMap.end()) {
         return Instance().staticConfigCheckMap[indexType](*cfg, knowhere::PARAM_TYPE::TRAIN, msg);
     }
Original file line number	Diff line number	Diff line change
`@@ -56,6 +56,14 @@ IndexStaticFaced<DataType>::ConfigCheck(const IndexType& indexType, const IndexV`
`56`	`56`	`return status;`
`57`	`57`	`}`
`58`	`58`
	`59`	`+ if constexpr (!std::is_same_v<DataType, knowhere::fp32>) {`
	`60`	`+ auto strategy = cfg->emb_list_strategy.value_or("");`
	`61`	`+ if (strategy == meta::EMB_LIST_STRATEGY_MUVERA \|\| strategy == meta::EMB_LIST_STRATEGY_LEMUR) {`
	`62`	`+ msg = "MUVERA/LEMUR strategies only support fp32 data type, got '" + strategy + "'";`
	`63`	`+ return Status::invalid_args;`
	`64`	`+ }`
	`65`	`+ }`
	`66`	`+`
`59`	`67`	`if (Instance().staticConfigCheckMap.find(indexType) != Instance().staticConfigCheckMap.end()) {`
`60`	`68`	`return Instance().staticConfigCheckMap[indexType](*cfg, knowhere::PARAM_TYPE::TRAIN, msg);`
`61`	`69`	`}`