lance-format
diff --git a/java/lance-jni/src/blocking_scanner.rs b/java/lance-jni/src/blocking_scanner.rs
Lines changed: 5 additions & 0 deletions
diff --git a/java/lance-jni/src/utils.rs b/java/lance-jni/src/utils.rs
Lines changed: 4 additions & 0 deletions
diff --git a/java/src/main/java/org/lance/ipc/Query.java b/java/src/main/java/org/lance/ipc/Query.java
Lines changed: 26 additions & 0 deletions
diff --git a/java/src/test/java/org/lance/JNITest.java b/java/src/test/java/org/lance/JNITest.java
Lines changed: 1 addition & 0 deletions
diff --git a/protos/ann.proto b/protos/ann.proto
Lines changed: 1 addition & 0 deletions
diff --git a/python/python/lance/dataset.py b/python/python/lance/dataset.py
Lines changed: 30 additions & 0 deletions
diff --git a/python/python/tests/test_vector_index.py b/python/python/tests/test_vector_index.py
Lines changed: 35 additions & 0 deletions
diff --git a/python/src/dataset.rs b/python/src/dataset.rs
Lines changed: 29 additions & 2 deletions
@@ -320,6 +320,11 @@ pub(crate) fn build_scanner_with_options<'a>(
 
         let use_index = env.get_boolean_from_method(&java_obj, "isUseIndex")?;
         scanner.use_index(use_index);
+
+        let query_parallelism = env
+            .call_method(&java_obj, "getQueryParallelism", "()I", &[])?
+            .i()?;
+        scanner.query_parallelism(query_parallelism);
         Ok(())
     })?;
 
 
@@ -207,6 +207,9 @@ pub fn get_query(env: &mut JNIEnv, query_obj: JObject) -> Result<Option<Query>>
         };
 
         let use_index = env.get_boolean_from_method(&java_obj, "isUseIndex")?;
+        let query_parallelism = env
+            .call_method(&java_obj, "getQueryParallelism", "()I", &[])?
+            .i()?;
 
         Ok(Query {
             column,
@@ -221,6 +224,7 @@ pub fn get_query(env: &mut JNIEnv, query_obj: JObject) -> Result<Option<Query>>
             metric_type: distance_type,
             use_index,
             dist_q_c: 0.0,
+            query_parallelism,
         })
     })?;
 
 
@@ -31,6 +31,7 @@ public class Query {
   private final Optional<Integer> refineFactor;
   private final Optional<DistanceType> distanceType;
   private final boolean useIndex;
+  private final int queryParallelism;
 
   private Query(Builder builder) {
     this.column = Preconditions.checkNotNull(builder.column, "Columns must be set");
@@ -50,6 +51,7 @@ private Query(Builder builder) {
     this.refineFactor = builder.refineFactor;
     this.distanceType = builder.distanceType;
     this.useIndex = builder.useIndex;
+    this.queryParallelism = builder.queryParallelism;
   }
 
   public String getColumn() {
@@ -92,6 +94,10 @@ public boolean isUseIndex() {
     return useIndex;
   }
 
+  /**
+   * Returns the query parallelism value this query was built with.
+   *
+   * @return the stored {@code queryParallelism} setting
+   */
+  public int getQueryParallelism() {
+    return this.queryParallelism;
+  }
+
   @Override
   public String toString() {
     return MoreObjects.toStringHelper(this)
@@ -104,6 +110,7 @@ public String toString() {
         .add("refineFactor", refineFactor.orElse(null))
         .add("distanceType", distanceType.orElse(null))
         .add("useIndex", useIndex)
+        .add("queryParallelism", queryParallelism)
         .toString();
   }
 
@@ -117,6 +124,7 @@ public static class Builder {
     private Optional<Integer> refineFactor = Optional.empty();
     private Optional<DistanceType> distanceType = Optional.empty();
     private boolean useIndex = true;
+    private int queryParallelism = 0;
 
     /**
      * Sets the column to be searched.
@@ -245,6 +253,24 @@ public Builder setUseIndex(boolean useIndex) {
       return this;
     }
 
+    /**
+     * Configures how many vector partitions may be searched concurrently for a single query.
+     *
+     * <p>Accepted values:
+     *
+     * <ul>
+     *   <li>{@code 0} (the default): automatic policy, which currently maps to the single-worker
+     *       sequential path.
+     *   <li>{@code -1}: use the CPU pool size.
+     *   <li>{@code 1}: single-worker sequential path.
+     *   <li>{@code 2} or greater: partition-parallel path, clamped to the CPU pool size.
+     * </ul>
+     *
+     * @param queryParallelism The partition search concurrency policy.
+     * @return The Builder instance for method chaining.
+     * @throws IllegalArgumentException if {@code queryParallelism} is less than -1.
+     */
+    public Builder setQueryParallelism(int queryParallelism) {
+      // -1 is the smallest value with a defined meaning; reject anything below it.
+      final boolean withinRange = queryParallelism >= -1;
+      Preconditions.checkArgument(
+          withinRange, "Query parallelism must be greater than or equal to -1");
+      this.queryParallelism = queryParallelism;
+      return this;
+    }
+
     /**
      * Builds the Query object.
      *
 
@@ -59,6 +59,7 @@ public void testQuery() {
                 .setRefineFactor(40)
                 .setDistanceType(DistanceType.L2)
                 .setUseIndex(true)
+                .setQueryParallelism(-1)
                 .build()));
   }
 
 
@@ -25,6 +25,7 @@ message VectorQueryProto {
   optional lance.index.pb.VectorMetricType metric_type = 10;
   bool use_index = 11;
   optional float dist_q_c = 12;
+  optional int32 query_parallelism = 13;
 }
 
 // Serializable form of ANNIvfSubIndexExec — the IVF sub-index search node.
 
@@ -6,6 +6,7 @@
 import copy
 import dataclasses
 import json
+import operator
 import os
 import random
 import time
@@ -5631,8 +5632,21 @@ def nearest(
         refine_factor: Optional[int] = None,
         use_index: bool = True,
         ef: Optional[int] = None,
+        query_parallelism: Optional[int] = None,
         distance_range: Optional[tuple[Optional[float], Optional[float]]] = None,
     ) -> ScannerBuilder:
+        """Configure nearest neighbor search.
+
+        Parameters
+        ----------
+        query_parallelism: int, optional
+            Maximum partition-search concurrency for a single vector query.
+            The default is 0. Value 0 uses the automatic policy, which
+            currently maps to the single-worker sequential path. Value -1 uses
+            the CPU pool size. Value 1 uses the single-worker sequential path.
+            Values >= 2 use the partition-parallel path and are clamped to the
+            CPU pool size.
+        """
         self._nearest = _build_vector_search_query(
             column,
             q,
@@ -5645,6 +5659,7 @@ def nearest(
             refine_factor=refine_factor,
             use_index=use_index,
             ef=ef,
+            query_parallelism=query_parallelism,
             distance_range=distance_range,
         )
         return self
@@ -6760,6 +6775,7 @@ def _build_vector_search_query(
     refine_factor: Optional[int] = None,
     use_index: bool = True,
     ef: Optional[int] = None,
+    query_parallelism: Optional[int] = None,
     distance_range: Optional[tuple[Optional[float], Optional[float]]] = None,
 ) -> dict:
     """Configure nearest neighbor search.
@@ -6787,6 +6803,12 @@ def _build_vector_search_query(
         Whether to use the index for the search.
     ef: int, optional
         The ef parameter for HNSW search.
+    query_parallelism: int, optional
+        Maximum partition-search concurrency for a single vector query.
+        The default is 0. Value 0 uses the automatic policy, which currently
+        maps to the single-worker sequential path. Value -1 uses the CPU pool
+        size. Value 1 uses the single-worker sequential path. Values >= 2 use
+        the partition-parallel path and are clamped to the CPU pool size.
     distance_range: tuple[Optional[float], Optional[float]], optional
         A tuple of (lower_bound, upper_bound) to filter results by distance.
         Both bounds are optional. The lower bound is inclusive and the upper
@@ -6854,6 +6876,11 @@ def _build_vector_search_query(
         # `ef` should be >= `k`, but `k` could be None so we can't check it here
         # the rust code will check it
         raise ValueError(f"ef must be > 0 but got {ef}")
+    if query_parallelism is not None:
+        query_parallelism = operator.index(query_parallelism)
+
+    if query_parallelism is not None and query_parallelism < -1:
+        raise ValueError("query_parallelism must be >= -1")
 
     if distance_range is not None:
         if len(distance_range) != 2:
@@ -6871,6 +6898,7 @@ def _build_vector_search_query(
         "refine_factor": refine_factor,
         "use_index": use_index,
         "ef": ef,
+        "query_parallelism": query_parallelism,
         "distance_range": distance_range,
     }
 
@@ -7043,6 +7071,7 @@ def __init__(
         refine_factor: Optional[int] = None,
         use_index: bool = True,
         ef: Optional[int] = None,
+        query_parallelism: Optional[int] = None,
     ):
         self._inner = _build_vector_search_query(
             column,
@@ -7055,6 +7084,7 @@ def __init__(
             refine_factor=refine_factor,
             use_index=use_index,
             ef=ef,
+            query_parallelism=query_parallelism,
         )
 
     def inner(self):
 
@@ -1864,6 +1864,41 @@ def test_vector_index_with_nprobes(indexed_dataset):
     ).analyze_plan()
 
 
+def test_vector_index_with_query_parallelism(indexed_dataset):
+    q = np.random.randn(128)
+
+    sequential = indexed_dataset.to_table(
+        nearest={
+            "column": "vector",
+            "q": q,
+            "k": 10,
+            "query_parallelism": 0,
+        }
+    )
+    parallel = indexed_dataset.to_table(
+        nearest={
+            "column": "vector",
+            "q": q,
+            "k": 10,
+            "query_parallelism": -1,
+        }
+    )
+
+    assert sequential == parallel
+
+
+def test_vector_index_invalid_query_parallelism(indexed_dataset):
+    with pytest.raises(ValueError, match="query_parallelism"):
+        indexed_dataset.scanner(
+            nearest={
+                "column": "vector",
+                "q": np.random.randn(128),
+                "k": 10,
+                "query_parallelism": -2,
+            }
+        )
+
+
 def test_knn_deleted_rows(tmp_path):
     data = create_table()
     ds = lance.write_dataset(data, tmp_path)
 
@@ -77,8 +77,8 @@ use lance_index::{
     progress::{IndexBuildProgress, NoopIndexBuildProgress},
     scalar::{FullTextSearchQuery, InvertedIndexParams, ScalarIndexParams},
     vector::{
-        Query as VectorQuery, hnsw::builder::HnswBuildParams, ivf::IvfBuildParams,
-        pq::PQBuildParams, sq::builder::SQBuildParams,
+        DEFAULT_QUERY_PARALLELISM, Query as VectorQuery, hnsw::builder::HnswBuildParams,
+        ivf::IvfBuildParams, pq::PQBuildParams, sq::builder::SQBuildParams,
     },
 };
 use lance_index::{
@@ -1251,6 +1251,7 @@ impl Dataset {
                 refine_factor,
                 use_index,
                 ef,
+                query_parallelism,
             ) = vector_query_params_from_dict(nearest, default_k)?;
 
             let (_, element_type) = get_vector_type(self_.ds.schema(), &column)
@@ -1311,6 +1312,7 @@ impl Dataset {
                     if let Some(ef) = ef {
                         s = s.ef(ef);
                     }
+                    s = s.query_parallelism(query_parallelism);
                     s.use_index(use_index);
                     if let Some((lower, upper)) = distance_range {
                         s.distance_range(lower, upper);
@@ -4309,8 +4311,28 @@ type VectorQueryParams = (
     Option<u32>,
     bool,
     Option<usize>,
+    i32,
 );
 
+/// Converts a Python value into a validated `query_parallelism` setting.
+///
+/// # Errors
+///
+/// Propagates the extraction error when `value` cannot be converted to `i32`,
+/// and returns a `PyValueError` when the extracted number is below `-1`.
+fn extract_query_parallelism(value: &Bound<'_, PyAny>) -> PyResult<i32> {
+    let requested: i32 = value.extract()?;
+    if requested >= -1 {
+        Ok(requested)
+    } else {
+        Err(PyValueError::new_err("query_parallelism must be >= -1"))
+    }
+}
+
+/// Reads the optional `query_parallelism` entry from a vector query dict.
+///
+/// A missing key, or a value for which `is_none()` is true, yields
+/// `DEFAULT_QUERY_PARALLELISM`; any other value is handed to
+/// `extract_query_parallelism` for conversion and range validation.
+fn vector_query_query_parallelism_from_dict(dict: &Bound<'_, PyDict>) -> PyResult<i32> {
+    match dict.get_item("query_parallelism")? {
+        Some(value) if !value.is_none() => extract_query_parallelism(&value),
+        _ => Ok(DEFAULT_QUERY_PARALLELISM),
+    }
+}
+
 fn vector_query_params_from_dict(
     dict: &Bound<'_, PyDict>,
     default_k: usize,
@@ -4416,6 +4438,8 @@ fn vector_query_params_from_dict(
         None
     };
 
+    let query_parallelism = vector_query_query_parallelism_from_dict(dict)?;
+
     Ok((
         column,
         key,
@@ -4426,6 +4450,7 @@ fn vector_query_params_from_dict(
         refine_factor,
         use_index,
         ef,
+        query_parallelism,
     ))
 }
 
@@ -4461,6 +4486,7 @@ impl PySearchFilter {
             refine_factor,
             use_index,
             ef,
+            query_parallelism,
         ) = vector_query_params_from_dict(query, default_k)?;
 
         let metric_type = Some(metric_type_opt.unwrap_or(MetricType::L2));
@@ -4477,6 +4503,7 @@ impl PySearchFilter {
             refine_factor,
             metric_type,
             use_index,
+            query_parallelism,
             dist_q_c: 0.0,
         };
Original file line number	Diff line number	Diff line change
`@@ -59,6 +59,7 @@ public void testQuery() {`
`59`	`59`	`.setRefineFactor(40)`
`60`	`60`	`.setDistanceType(DistanceType.L2)`
`61`	`61`	`.setUseIndex(true)`
	`62`	`+ .setQueryParallelism(-1)`
`62`	`63`	`.build()));`
`63`	`64`	`}`
`64`	`65`
Original file line number	Diff line number	Diff line change
`@@ -25,6 +25,7 @@ message VectorQueryProto {`
`25`	`25`	`optional lance.index.pb.VectorMetricType metric_type = 10;`
`26`	`26`	`bool use_index = 11;`
`27`	`27`	`optional float dist_q_c = 12;`
	`28`	`+ optional int32 query_parallelism = 13;`
`28`	`29`	`}`
`29`	`30`
`30`	`31`	`// Serializable form of ANNIvfSubIndexExec — the IVF sub-index search node.`