lance-format
diff --git a/lance-spark-base_2.12/src/main/java/org/lance/spark/LanceSparkReadOptions.java b/lance-spark-base_2.12/src/main/java/org/lance/spark/LanceSparkReadOptions.java
Lines changed: 6 additions & 6 deletions
diff --git a/lance-spark-base_2.12/src/main/java/org/lance/spark/read/LanceScan.java b/lance-spark-base_2.12/src/main/java/org/lance/spark/read/LanceScan.java
Lines changed: 31 additions & 8 deletions
diff --git a/lance-spark-base_2.12/src/main/java/org/lance/spark/read/LanceScanBuilder.java b/lance-spark-base_2.12/src/main/java/org/lance/spark/read/LanceScanBuilder.java
Lines changed: 116 additions & 100 deletions
@@ -107,7 +107,7 @@ public class LanceSparkReadOptions implements Serializable {
   private final String datasetName;
   private final boolean pushDownFilters;
   private final Integer blockSize;
-  private final Integer version;
+  private final Long version;
   private final Integer indexCacheSize;
   private final Integer metadataCacheSize;
   private final int batchSize;
@@ -238,7 +238,7 @@ public Integer getBlockSize() {
     return blockSize;
   }
 
-  public Integer getVersion() {
+  public Long getVersion() {
     return version;
   }
 
@@ -312,7 +312,7 @@ public void setNamespace(LanceNamespace namespace) {
    * @param newVersion the version to use
    * @return a new LanceSparkReadOptions with the specified version
    */
-  public LanceSparkReadOptions withVersion(int newVersion) {
+  public LanceSparkReadOptions withVersion(long newVersion) {
     return builder()
         .datasetUri(this.datasetUri)
         .pushDownFilters(this.pushDownFilters)
@@ -411,7 +411,7 @@ public static class Builder {
     private boolean pushDownFilters = DEFAULT_PUSH_DOWN_FILTERS;
     private Integer blockSize;
     private Query nearest;
-    private Integer version;
+    private Long version;
     private Integer indexCacheSize;
     private Integer metadataCacheSize;
     private int batchSize = DEFAULT_BATCH_SIZE;
@@ -453,7 +453,7 @@ public Builder nearest(String json) {
       return this;
     }
 
-    public Builder version(Integer version) {
+    public Builder version(Long version) {
       this.version = version;
       return this;
     }
@@ -546,7 +546,7 @@ private void parseTypedFlags(Map<String, String> opts) {
         this.blockSize = Integer.parseInt(opts.get(CONFIG_BLOCK_SIZE));
       }
       if (opts.containsKey(CONFIG_VERSION)) {
-        this.version = Integer.parseInt(opts.get(CONFIG_VERSION));
+        this.version = Long.parseLong(opts.get(CONFIG_VERSION));
       }
       if (opts.containsKey(CONFIG_INDEX_CACHE_SIZE)) {
         this.indexCacheSize = Integer.parseInt(opts.get(CONFIG_INDEX_CACHE_SIZE));
 
@@ -89,6 +89,22 @@ public class LanceScan
    */
   private final Set<Integer> cachedSurvivingFragmentIds;
 
+  /**
+   * Splits pre-computed on the driver during {@link LanceScanBuilder#build()}. Each entry is one
+   * fragment. Built from a single {@code Dataset} handle that was already opened for manifest /
+   * schema / zonemap loading, so no second {@code Dataset.open()} is needed at {@link
+   * #planInputPartitions()} time.
+   */
+  private final List<LanceSplit> precomputedSplits;
+
+  /**
+   * Per-fragment logical row counts (after deletions), captured together with {@link
+   * #precomputedSplits} on the driver. Consumed by {@link #pruneByLimit}. Not declared {@code
+   * transient}: transient fields are not serialized, and deserialization bypasses the constructor,
+   * so the field would come back {@code null} and NPE inside {@link #pruneByLimit}.
+   */
+  private final java.util.Map<Integer, Long> precomputedFragmentRowCounts;
+
   /** Number of partitions after pruning, set during {@link #planInputPartitions()}. */
   private transient int numPartitions = -1;
 
@@ -121,6 +137,8 @@ public LanceScan(
       LanceStatistics statistics,
       java.util.Map<String, List<ZoneStats>> zonemapStats,
       Set<Integer> survivingFragmentIds,
+      List<LanceSplit> precomputedSplits,
+      java.util.Map<Integer, Long> precomputedFragmentRowCounts,
       Expression activeShardingExpression,
       java.util.Map<Integer, Object> fragmentShardingKeys,
       java.util.Map<String, String> initialStorageOptions,
@@ -140,6 +158,11 @@ public LanceScan(
     this.statistics = statistics;
     this.zonemapStats = zonemapStats != null ? zonemapStats : Collections.emptyMap();
     this.cachedSurvivingFragmentIds = survivingFragmentIds;
+    this.precomputedSplits = precomputedSplits;
+    this.precomputedFragmentRowCounts =
+        precomputedFragmentRowCounts != null
+            ? precomputedFragmentRowCounts
+            : Collections.emptyMap();
     this.activeShardingExpression = activeShardingExpression;
     this.fragmentShardingKeys = fragmentShardingKeys;
     this.initialStorageOptions = initialStorageOptions;
@@ -154,8 +177,10 @@ public Batch toBatch() {
 
   @Override
   public InputPartition[] planInputPartitions() {
-    LanceSplit.ScanPlanResult planResult = LanceSplit.planScan(readOptions);
-    List<LanceSplit> prunedSplits = pruneByRowAddrFilters(planResult.getSplits());
+    // Splits and per-fragment row counts are pre-computed on the driver during
+    // LanceScanBuilder.build() from the same Dataset handle that loaded manifest /
+    // schema / zonemap stats. This avoids a second Dataset.open() at plan time.
+    List<LanceSplit> prunedSplits = pruneByRowAddrFilters(precomputedSplits);
 
     // Zonemap-based fragment pruning: uses per-column min/max/null_count
     // statistics to eliminate fragments that provably cannot match
@@ -166,15 +191,13 @@ public InputPartition[] planInputPartitions() {
     // use per-fragment row counts to plan only enough splits to satisfy the limit.
     // This avoids scheduling hundreds of unnecessary tasks. Correctness is guaranteed
     // because Spark still keeps a global CollectLimit on top (isPartiallyPushed = true).
-    prunedSplits = pruneByLimit(prunedSplits, planResult.getFragmentRowCounts());
+    prunedSplits = pruneByLimit(prunedSplits, precomputedFragmentRowCounts);
 
     // Capture as effectively final for use in lambda
     final List<LanceSplit> finalSplits = prunedSplits;
 
-    // Use resolved version for snapshot isolation - ensures all workers read the same version
-    LanceSparkReadOptions resolvedReadOptions =
-        readOptions.withVersion((int) planResult.getResolvedVersion());
-
+    // readOptions is already pinned to the resolved version by LanceScanBuilder for
+    // snapshot isolation across all workers.
     InputPartition[] result =
         IntStream.range(0, finalSplits.size())
             .mapToObj(
@@ -192,7 +215,7 @@ public InputPartition[] planInputPartitions() {
                       schema,
                       i,
                       split,
-                      resolvedReadOptions,
+                      readOptions,
                       whereConditions,
                       limit,
                       offset,
 
@@ -147,113 +147,129 @@ private void closeLazyDataset() {
 
   @Override
   public Scan build() {
-    // Return LocalScan if we have a metadata-only aggregation result
-    if (localScan != null) {
-      closeLazyDataset();
-      return localScan;
-    }
+    // Wrap the entire planning body in try/finally to guarantee that the lazily-opened native
+    // dataset handle (lazyDataset) is always released, including when intermediate steps such as
+    // zonemap loading or LanceSplit.planScan(dataset) throw.
+    try {
+      // Return LocalScan if we have a metadata-only aggregation result
+      if (localScan != null) {
+        return localScan;
+      }
 
-    // Get statistics from manifest summary before closing dataset
-    ManifestSummary summary = getOrOpenDataset().getVersion().getManifestSummary();
-
-    // Collect all columns that need zonemap stats: filter columns + sharding columns.
-    Set<String> columnsToLoad = extractReferencedColumns(pushedPredicates);
-    Dataset dataset = getOrOpenDataset();
-    LanceSchema lanceSchema = dataset.getLanceSchema();
-    ShardingSpec activeShardingSpec =
-        SparkLanceShardingUtils.isEmpty(shardingSpec)
-            ? SparkLanceShardingUtils.firstShardingSpec(dataset)
-            : shardingSpec;
-    for (ShardingField field : SparkLanceShardingUtils.fields(activeShardingSpec)) {
-      columnsToLoad.add(SparkLanceShardingUtils.columnName(field, lanceSchema));
-    }
+      // Get statistics from manifest summary before closing dataset
+      ManifestSummary summary = getOrOpenDataset().getVersion().getManifestSummary();
+
+      // Collect all columns that need zonemap stats: filter columns + sharding columns.
+      Set<String> columnsToLoad = extractReferencedColumns(pushedPredicates);
+      Dataset dataset = getOrOpenDataset();
+      LanceSchema lanceSchema = dataset.getLanceSchema();
+      ShardingSpec activeShardingSpec =
+          SparkLanceShardingUtils.isEmpty(shardingSpec)
+              ? SparkLanceShardingUtils.firstShardingSpec(dataset)
+              : shardingSpec;
+      for (ShardingField field : SparkLanceShardingUtils.fields(activeShardingSpec)) {
+        columnsToLoad.add(SparkLanceShardingUtils.columnName(field, lanceSchema));
+      }
 
-    // Load zonemap stats for all requested columns in one pass.
-    Map<String, List<ZoneStats>> zonemapStats = loadZonemapStats(getOrOpenDataset(), columnsToLoad);
-
-    // Detect sharding-compatible fragments from zonemap stats. Each field checks its column's
-    // zones; if every fragment has a single sharding value, we get a fragment-to-key map.
-    Map<Integer, Object> fragmentShardingKeys = null;
-    Expression activeShardingExpression = null;
-    for (ShardingField field : SparkLanceShardingUtils.fields(activeShardingSpec)) {
-      String column = SparkLanceShardingUtils.columnName(field, lanceSchema);
-      List<ZoneStats> colStats = zonemapStats.get(column);
-      if (colStats == null || colStats.isEmpty()) {
-        LOG.warn(
-            "Sharding column '{}' (transform={}) has no zonemap stats; sharding detection disabled",
-            column,
-            field.transform().orElse(null));
-        continue;
+      // Load zonemap stats for all requested columns in one pass.
+      Map<String, List<ZoneStats>> zonemapStats =
+          loadZonemapStats(getOrOpenDataset(), columnsToLoad);
+
+      // Detect sharding-compatible fragments from zonemap stats. Each field checks its column's
+      // zones; if every fragment has a single sharding value, we get a fragment-to-key map.
+      Map<Integer, Object> fragmentShardingKeys = null;
+      Expression activeShardingExpression = null;
+      for (ShardingField field : SparkLanceShardingUtils.fields(activeShardingSpec)) {
+        String column = SparkLanceShardingUtils.columnName(field, lanceSchema);
+        List<ZoneStats> colStats = zonemapStats.get(column);
+        if (colStats == null || colStats.isEmpty()) {
+          LOG.warn(
+              "Sharding column '{}' (transform={}) has no zonemap stats;"
+                  + " sharding detection disabled",
+              column,
+              field.transform().orElse(null));
+          continue;
+        }
+        java.util.Optional<Map<Integer, Object>> keys =
+            SparkLanceShardingUtils.detectFragmentKeys(field, lanceSchema, colStats);
+        if (keys.isPresent()) {
+          fragmentShardingKeys = keys.get();
+          activeShardingExpression = SparkLanceShardingUtils.toSparkExpression(field, lanceSchema);
+          LOG.info(
+              "Detected Lance sharding field {}('{}') with {} fragments",
+              field.transform().orElse(null),
+              column,
+              fragmentShardingKeys.size());
+          break;
+        }
       }
-      java.util.Optional<Map<Integer, Object>> keys =
-          SparkLanceShardingUtils.detectFragmentKeys(field, lanceSchema, colStats);
-      if (keys.isPresent()) {
-        fragmentShardingKeys = keys.get();
-        activeShardingExpression = SparkLanceShardingUtils.toSparkExpression(field, lanceSchema);
-        LOG.info(
-            "Detected Lance sharding field {}('{}') with {} fragments",
-            field.transform().orElse(null),
-            column,
-            fragmentShardingKeys.size());
-        break;
+
+      // Pre-compute fragment pruning so we can (a) estimate post-pruning statistics for
+      // JoinSelection (BroadcastHashJoin vs SortMergeJoin) and (b) pass the cached result
+      // to LanceScan to avoid re-computing during planInputPartitions().
+      Set<Integer> survivingFragmentIds = null;
+      if (pushedPredicates.length > 0 && !zonemapStats.isEmpty()) {
+        survivingFragmentIds =
+            ZonemapFragmentPruner.pruneFragments(pushedPredicates, zonemapStats).orElse(null);
       }
-    }
 
-    // Pre-compute fragment pruning so we can (a) estimate post-pruning statistics for
-    // JoinSelection (BroadcastHashJoin vs SortMergeJoin) and (b) pass the cached result
-    // to LanceScan to avoid re-computing during planInputPartitions().
-    Set<Integer> survivingFragmentIds = null;
-    if (pushedPredicates.length > 0 && !zonemapStats.isEmpty()) {
-      survivingFragmentIds =
-          ZonemapFragmentPruner.pruneFragments(pushedPredicates, zonemapStats).orElse(null);
-    }
+      // Scale rows and full size by the zonemap fragment-pruning ratio first, then let
+      // LanceStatistics.estimateProjected apply the column-width ratio on top
+      // (when the projected schema is narrower than the full schema).
+      long projectedRows = summary.getTotalRows();
+      long projectedFullSize = summary.getTotalFilesSize();
+      if (survivingFragmentIds != null && summary.getTotalFragments() > 0) {
+        double ratio = (double) survivingFragmentIds.size() / summary.getTotalFragments();
+        projectedRows = (long) (projectedRows * ratio);
+        projectedFullSize = (long) (projectedFullSize * ratio);
+      }
+      LanceStatistics statistics =
+          LanceStatistics.estimateProjected(projectedRows, projectedFullSize, fullSchema, schema);
+      if (survivingFragmentIds != null) {
+        LOG.debug(
+            "Scan statistics after pruning: {} of {} fragments survive,"
+                + " estimatedSize={}, estimatedRows={} (full: size={}, rows={})",
+            survivingFragmentIds.size(),
+            summary.getTotalFragments(),
+            statistics.sizeInBytes(),
+            statistics.numRows(),
+            summary.getTotalFilesSize(),
+            summary.getTotalRows());
+      }
 
-    // Scale rows and full size by the zonemap fragment-pruning ratio first, then let
-    // LanceStatistics.estimateProjected apply the column-width ratio on top
-    // (when the projected schema is narrower than the full schema).
-    long projectedRows = summary.getTotalRows();
-    long projectedFullSize = summary.getTotalFilesSize();
-    if (survivingFragmentIds != null && summary.getTotalFragments() > 0) {
-      double ratio = (double) survivingFragmentIds.size() / summary.getTotalFragments();
-      projectedRows = (long) (projectedRows * ratio);
-      projectedFullSize = (long) (projectedFullSize * ratio);
-    }
-    LanceStatistics statistics =
-        LanceStatistics.estimateProjected(projectedRows, projectedFullSize, fullSchema, schema);
-    if (survivingFragmentIds != null) {
-      LOG.debug(
-          "Scan statistics after pruning: {} of {} fragments survive,"
-              + " estimatedSize={}, estimatedRows={} (full: size={}, rows={})",
-          survivingFragmentIds.size(),
-          summary.getTotalFragments(),
-          statistics.sizeInBytes(),
-          statistics.numRows(),
-          summary.getTotalFilesSize(),
-          summary.getTotalRows());
+      // Pre-compute splits and per-fragment row counts from the same Dataset handle that we
+      // already opened above. This consolidates two driver-side opens into one and lets us pin
+      // the resolved version onto the read options shipped to workers, providing snapshot
+      // isolation across all tasks of this query. The version is kept as a long end-to-end so
+      // long-lived high-write-frequency datasets do not silently truncate to a wrong version.
+      LanceSplit.ScanPlanResult scanPlan = LanceSplit.planScan(dataset);
+      LanceSparkReadOptions resolvedReadOptions =
+          readOptions.withVersion(scanPlan.getResolvedVersion());
+
+      Optional<String> whereCondition =
+          FilterPushDown.compileFiltersToSqlWhereClause(pushedPredicates);
+      return new LanceScan(
+          schema,
+          resolvedReadOptions,
+          whereCondition,
+          limit,
+          offset,
+          topNSortOrders,
+          pushedAggregation,
+          pushedPredicates,
+          statistics,
+          zonemapStats,
+          survivingFragmentIds,
+          scanPlan.getSplits(),
+          scanPlan.getFragmentRowCounts(),
+          activeShardingExpression,
+          fragmentShardingKeys,
+          initialStorageOptions,
+          namespaceImpl,
+          namespaceProperties);
+    } finally {
+      closeLazyDataset();
     }
-
-    // Close the lazily opened dataset - it's no longer needed after build
-    closeLazyDataset();
-
-    Optional<String> whereCondition =
-        FilterPushDown.compileFiltersToSqlWhereClause(pushedPredicates);
-    return new LanceScan(
-        schema,
-        readOptions,
-        whereCondition,
-        limit,
-        offset,
-        topNSortOrders,
-        pushedAggregation,
-        pushedPredicates,
-        statistics,
-        zonemapStats,
-        survivingFragmentIds,
-        activeShardingExpression,
-        fragmentShardingKeys,
-        initialStorageOptions,
-        namespaceImpl,
-        namespaceProperties);
   }
 
   @Override