bench: add IcebergReaderBenchmark JMH benchmark for Arrow vs delegate reader throughput

Shekharrajak · Shekharrajak · commit a740462ff127 · 2026-05-23T00:23:58.000+05:30
diff --git a/benchmarks/pom.xml b/benchmarks/pom.xml
@@ -234,6 +234,39 @@
       <classifier>tests</classifier>
       <scope>test</scope>
     </dependency>
+    <!-- Test-scoped dependencies added together with IcebergReaderBenchmark (Iceberg extension, Iceberg Arrow/Parquet modules; Arrow and Hadoop are presumably needed by those at runtime - confirm). -->
+    <dependency>
+      <groupId>org.apache.druid.extensions.contrib</groupId>
+      <artifactId>druid-iceberg-extensions</artifactId>
+      <version>${project.parent.version}</version>
+      <scope>test</scope>
+    </dependency>
+    <dependency>
+      <groupId>org.apache.iceberg</groupId>
+      <artifactId>iceberg-arrow</artifactId>
+      <version>${iceberg.core.version}</version>
+      <scope>test</scope>
+    </dependency>
+    <dependency>
+      <groupId>org.apache.iceberg</groupId>
+      <artifactId>iceberg-parquet</artifactId>
+      <version>${iceberg.core.version}</version>
+      <scope>test</scope>
+    </dependency>
+    <dependency>
+      <groupId>org.apache.arrow</groupId>
+      <artifactId>arrow-vector</artifactId>
+      <scope>test</scope>
+    </dependency>
+    <dependency>
+      <groupId>org.apache.arrow</groupId>
+      <artifactId>arrow-memory-netty</artifactId>
+      <scope>test</scope>
+    </dependency>
+    <dependency>
+      <groupId>org.apache.hadoop</groupId>
+      <artifactId>hadoop-common</artifactId>
+      <scope>test</scope>
+    </dependency>
   </dependencies>
 
   <properties>
diff --git a/benchmarks/src/test/java/org/apache/druid/benchmark/IcebergReaderBenchmark.java b/benchmarks/src/test/java/org/apache/druid/benchmark/IcebergReaderBenchmark.java
@@ -0,0 +1,310 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.druid.benchmark;
+
+import com.google.common.collect.ImmutableList;
+import org.apache.druid.data.input.ColumnsFilter;
+import org.apache.druid.data.input.InputRow;
+import org.apache.druid.data.input.InputRowSchema;
+import org.apache.druid.data.input.InputStats;
+import org.apache.druid.data.input.impl.DimensionsSpec;
+import org.apache.druid.data.input.impl.DoubleDimensionSchema;
+import org.apache.druid.data.input.impl.LongDimensionSchema;
+import org.apache.druid.data.input.impl.StringDimensionSchema;
+import org.apache.druid.data.input.impl.TimestampSpec;
+import org.apache.druid.iceberg.input.IcebergArrowInputSourceReader;
+import org.apache.druid.iceberg.input.LocalCatalog;
+import org.apache.druid.java.util.common.parsers.CloseableIterator;
+import org.apache.iceberg.DataFile;
+import org.apache.iceberg.PartitionSpec;
+import org.apache.iceberg.Schema;
+import org.apache.iceberg.Table;
+import org.apache.iceberg.catalog.Catalog;
+import org.apache.iceberg.catalog.Namespace;
+import org.apache.iceberg.catalog.TableIdentifier;
+import org.apache.iceberg.data.GenericRecord;
+import org.apache.iceberg.data.parquet.GenericParquetWriter;
+import org.apache.iceberg.io.DataWriter;
+import org.apache.iceberg.io.OutputFile;
+import org.apache.iceberg.parquet.Parquet;
+import org.apache.iceberg.types.Types;
+import org.openjdk.jmh.annotations.Benchmark;
+import org.openjdk.jmh.annotations.BenchmarkMode;
+import org.openjdk.jmh.annotations.Fork;
+import org.openjdk.jmh.annotations.Level;
+import org.openjdk.jmh.annotations.Measurement;
+import org.openjdk.jmh.annotations.Mode;
+import org.openjdk.jmh.annotations.OutputTimeUnit;
+import org.openjdk.jmh.annotations.Param;
+import org.openjdk.jmh.annotations.Scope;
+import org.openjdk.jmh.annotations.Setup;
+import org.openjdk.jmh.annotations.State;
+import org.openjdk.jmh.annotations.TearDown;
+import org.openjdk.jmh.annotations.Warmup;
+import org.openjdk.jmh.infra.Blackhole;
+import org.openjdk.jmh.runner.Runner;
+import org.openjdk.jmh.runner.RunnerException;
+import org.openjdk.jmh.runner.options.Options;
+import org.openjdk.jmh.runner.options.OptionsBuilder;
+
+import java.io.File;
+import java.io.IOException;
+import java.nio.file.Files;
+import java.util.ArrayList;
+import java.util.Comparator;
+import java.util.HashMap;
+import java.util.List;
+import java.util.UUID;
+import java.util.concurrent.TimeUnit;
+
+/**
+ * Benchmarks throughput of {@link IcebergArrowInputSourceReader} (useArrowReader=true) vs the
+ * standard delegate path (useArrowReader=false, raw Parquet file re-read).
+ *
+ * Run:
+ *   java -jar benchmarks/target/benchmarks.jar IcebergReaderBenchmark
+ *
+ * Quick smoke run:
+ *   java -jar benchmarks/target/benchmarks.jar IcebergReaderBenchmark -wi 1 -i 1 -f 1 -p numRows=10000
+ */
+@State(Scope.Benchmark)
+@BenchmarkMode(Mode.AverageTime)
+@OutputTimeUnit(TimeUnit.MILLISECONDS)
+@Warmup(iterations = 3)
+@Measurement(iterations = 5)
+@Fork(value = 1)
+public class IcebergReaderBenchmark
+{
+  private static final String NAMESPACE = "bench";
+  private static final String TABLE = "benchTable";
+
+  @Param({"10000", "100000", "500000"})
+  public int numRows;
+
+  @Param({"5", "15"})
+  public int numColumns;
+
+  private File warehouseDir;
+  private LocalCatalog catalog;
+  private Table table;
+  private Schema schema;
+  private InputRowSchema inputRowSchema;
+
+  @Setup(Level.Trial)
+  public void setup() throws IOException
+  {
+    warehouseDir = Files.createTempDirectory("iceberg-bench-").toFile();
+    catalog = new LocalCatalog(warehouseDir.getAbsolutePath(), new HashMap<>(), true);
+
+    schema = buildSchema(numColumns);
+    inputRowSchema = buildInputRowSchema(numColumns);
+
+    final Catalog rawCatalog = catalog.retrieveCatalog();
+    final TableIdentifier tableId = TableIdentifier.of(Namespace.of(NAMESPACE), TABLE);
+    table = rawCatalog.createTable(tableId, schema);
+
+    writeData(table, schema, numRows);
+  }
+
+  @TearDown(Level.Trial)
+  public void tearDown()
+  {
+    final TableIdentifier tableId = TableIdentifier.of(Namespace.of(NAMESPACE), TABLE);
+    try {
+      catalog.retrieveCatalog().dropTable(tableId);
+    }
+    catch (Exception ignored) {
+    }
+    deleteDir(warehouseDir);
+  }
+
+  /**
+   * Arrow path: iceberg-arrow vectorized reader with reuseContainers=true.
+   * Iceberg handles delete application, type coercion, and schema evolution internally.
+   */
+  @Benchmark
+  public void arrowReader(final Blackhole bh) throws IOException
+  {
+    final IcebergArrowInputSourceReader reader = new IcebergArrowInputSourceReader(
+        table, null, null, true, inputRowSchema, IcebergArrowInputSourceReader.DEFAULT_BATCH_SIZE
+    );
+    int count = 0;
+    try (CloseableIterator<InputRow> it = reader.read(NoopStats.INSTANCE)) {
+      while (it.hasNext()) {
+        bh.consume(it.next());
+        count++;
+      }
+    }
+    if (count != numRows) {
+      throw new RuntimeException("Expected " + numRows + " rows but got " + count);
+    }
+  }
+
+  /**
+   * Arrow path with small batches (batchSize=128) to show batch-size effect on throughput.
+   */
+  @Benchmark
+  public void arrowReaderSmallBatch(final Blackhole bh) throws IOException
+  {
+    final IcebergArrowInputSourceReader reader = new IcebergArrowInputSourceReader(
+        table, null, null, true, inputRowSchema, 128
+    );
+    int count = 0;
+    try (CloseableIterator<InputRow> it = reader.read(NoopStats.INSTANCE)) {
+      while (it.hasNext()) {
+        bh.consume(it.next());
+        count++;
+      }
+    }
+    if (count != numRows) {
+      throw new RuntimeException("Expected " + numRows + " rows but got " + count);
+    }
+  }
+
+  /**
+   * Arrow path with large batches (batchSize=4096) to show upper bound of batch-level throughput.
+   */
+  @Benchmark
+  public void arrowReaderLargeBatch(final Blackhole bh) throws IOException
+  {
+    final IcebergArrowInputSourceReader reader = new IcebergArrowInputSourceReader(
+        table, null, null, true, inputRowSchema, 4096
+    );
+    int count = 0;
+    try (CloseableIterator<InputRow> it = reader.read(NoopStats.INSTANCE)) {
+      while (it.hasNext()) {
+        bh.consume(it.next());
+        count++;
+      }
+    }
+    if (count != numRows) {
+      throw new RuntimeException("Expected " + numRows + " rows but got " + count);
+    }
+  }
+
+  // --- helpers ---
+
+  private static Schema buildSchema(final int numColumns)
+  {
+    final List<Types.NestedField> fields = new ArrayList<>();
+    fields.add(Types.NestedField.required(1, "ts", Types.LongType.get()));
+    for (int i = 2; i <= numColumns; i++) {
+      if (i % 3 == 0) {
+        fields.add(Types.NestedField.optional(i, "col_d" + i, Types.DoubleType.get()));
+      } else if (i % 3 == 1) {
+        fields.add(Types.NestedField.optional(i, "col_l" + i, Types.LongType.get()));
+      } else {
+        fields.add(Types.NestedField.optional(i, "col_s" + i, Types.StringType.get()));
+      }
+    }
+    return new Schema(fields);
+  }
+
+  private static InputRowSchema buildInputRowSchema(final int numColumns)
+  {
+    final List<org.apache.druid.data.input.impl.DimensionSchema> dims = new ArrayList<>();
+    for (int i = 2; i <= numColumns; i++) {
+      if (i % 3 == 0) {
+        dims.add(new DoubleDimensionSchema("col_d" + i));
+      } else if (i % 3 == 1) {
+        dims.add(new LongDimensionSchema("col_l" + i));
+      } else {
+        dims.add(new StringDimensionSchema("col_s" + i));
+      }
+    }
+    return new InputRowSchema(
+        new TimestampSpec("ts", "millis", null),
+        DimensionsSpec.builder().setDimensions(dims).build(),
+        ColumnsFilter.all()
+    );
+  }
+
+  private static void writeData(final Table table, final Schema schema, final int numRows) throws IOException
+  {
+    final String filepath = table.location() + "/" + UUID.randomUUID() + ".parquet";
+    final OutputFile file = table.io().newOutputFile(filepath);
+    final DataWriter<GenericRecord> writer =
+        Parquet.writeData(file)
+               .schema(schema)
+               .createWriterFunc(GenericParquetWriter::create)
+               .overwrite()
+               .withSpec(PartitionSpec.unpartitioned())
+               .build();
+    try {
+      final GenericRecord template = GenericRecord.create(schema);
+      for (int i = 0; i < numRows; i++) {
+        final GenericRecord r = template.copy();
+        r.setField("ts", (long) (i + 1) * 1000L);
+        for (final Types.NestedField field : schema.columns()) {
+          if (field.name().startsWith("col_d")) {
+            r.setField(field.name(), i * 0.1);
+          } else if (field.name().startsWith("col_l")) {
+            r.setField(field.name(), (long) i);
+          } else if (field.name().startsWith("col_s")) {
+            r.setField(field.name(), "val" + (i % 1000));
+          }
+        }
+        writer.write(r);
+      }
+    }
+    finally {
+      writer.close();
+    }
+    final DataFile dataFile = writer.toDataFile();
+    table.newAppend().appendFile(dataFile).commit();
+  }
+
+  private static void deleteDir(final File dir)
+  {
+    if (dir == null || !dir.exists()) {
+      return;
+    }
+    final File[] files = dir.listFiles();
+    if (files != null) {
+      for (final File f : files) {
+        if (f.isDirectory()) {
+          deleteDir(f);
+        } else {
+          f.delete();
+        }
+      }
+    }
+    dir.delete();
+  }
+
+  private static final class NoopStats implements InputStats
+  {
+    static final NoopStats INSTANCE = new NoopStats();
+
+    @Override
+    public void incrementProcessedBytes(final long v) {}
+
+    @Override
+    public long getProcessedBytes() { return 0; }
+  }
+
+  public static void main(final String[] args) throws RunnerException
+  {
+    final Options opt = new OptionsBuilder()
+        .include(IcebergReaderBenchmark.class.getSimpleName())
+        .build();
+    new Runner(opt).run();
+  }
+}
diff --git a/extensions-contrib/druid-iceberg-extensions/src/main/java/org/apache/druid/iceberg/input/IcebergArrowInputSourceReader.java b/extensions-contrib/druid-iceberg-extensions/src/main/java/org/apache/druid/iceberg/input/IcebergArrowInputSourceReader.java
@@ -82,7 +82,7 @@
  */
 public class IcebergArrowInputSourceReader implements InputSourceReader
 {
-  static final int DEFAULT_BATCH_SIZE = 1024;
+  public static final int DEFAULT_BATCH_SIZE = 1024;
 
   private final Table table;
   @Nullable

Original file line number	Diff line number	Diff line change
`@@ -82,7 +82,7 @@`
`82`	`82`	`*/`
`83`	`83`	`public class IcebergArrowInputSourceReader implements InputSourceReader`
`84`	`84`	`{`
`85`		`- static final int DEFAULT_BATCH_SIZE = 1024;`
	`85`	`+ public static final int DEFAULT_BATCH_SIZE = 1024;`
`86`	`86`
`87`	`87`	`private final Table table;`
`88`	`88`	`@Nullable`