feat(library-selection): #205 Phase 7 perf benchmarks (P-02, P-03) (#210)

zackees · claude · web-flow · commit 0bf4b2f3b429 · 2026-04-25T02:57:41.000-07:00
Adds two `criterion` benchmarks that capture baseline numbers for issue #205's Phase 7 perf gates. This PR lands the harness; CI gating against thresholds is a follow-up once we have a stable measurement on a known runner spec. ## Benchmarks - `crates/fbuild-header-scan/benches/scan_throughput.rs` Measures `scan()` throughput on three input sizes (tiny/medium/large) with adversary fixtures (raw strings, comments, identifiers ending in `R`/`L`, char literals). Target per #205 P-03: >= 50 MB/s single-thread. - `crates/fbuild-library-select/benches/resolve_cold.rs` End-to-end `resolve()` walk on a synthetic 30-library framework tree with a 5-level transitive include chain. Target per #205 P-02: <= 200 ms cold for a typical teensy41 project. Uses `MiniFramework` from `fbuild-test-support` so the bench is hermetic. Both use `harness = false` and depend on the new workspace `criterion = "0.5"` dev-dep. Run with: ```bash uv run soldr cargo bench -p fbuild-header-scan --bench scan_throughput uv run soldr cargo bench -p fbuild-library-select --bench resolve_cold ``` ## Out of scope (still tracked) - P-01 (warm matrix) — gated on Phase 4 cache (zccache#130). - P-04 (cache-hit round-trip) — same. - CI gating against the captured thresholds — follow-up once runner variance is characterized. ## Verification - `uv run soldr cargo build --release -p fbuild-header-scan -p fbuild-library-select --benches` — green. - `uv run soldr cargo clippy --workspace --all-targets -- -D warnings` — green. - `uv run soldr cargo fmt --all --check` — clean. Refs: #205, #202, #204 Co-authored-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
diff --git a/Cargo.lock b/Cargo.lock
diff --git a/Cargo.toml b/Cargo.toml
@@ -58,6 +58,7 @@ tokio-tungstenite = "0.24"
 async-trait = "0.1"
 dashmap = "6"
 blake3 = "1"
+criterion = { version = "0.5", default-features = false, features = ["html_reports"] }
 mimalloc = "0.1"
 object = { version = "0.36", default-features = false, features = ["read", "std", "elf", "write"] }
 rusqlite = { version = "0.31", features = ["bundled"] }
diff --git a/crates/fbuild-header-scan/Cargo.toml b/crates/fbuild-header-scan/Cargo.toml
@@ -9,4 +9,9 @@ license.workspace = true
 [dependencies]
 
 [dev-dependencies]
+criterion = { workspace = true }
 tempfile = { workspace = true }
+
+[[bench]]
+name = "scan_throughput"
+harness = false
diff --git a/crates/fbuild-header-scan/benches/README.md b/crates/fbuild-header-scan/benches/README.md
@@ -0,0 +1,20 @@
+# fbuild-header-scan benches
+
+Criterion micro-benchmarks for `fbuild-header-scan`.
+
+`scan_throughput.rs` measures `scan()` single-thread throughput (MB/s) over
+three synthetic C++ fixtures: **tiny** (64 B requested, which rounds up to one
+full template repetition of a few hundred bytes; measures per-call overhead),
+**medium** (~100 KiB), and **large** (~2 MiB, stand-in for a Teensy-core-sized
+translation unit). The fixtures exercise the scanner's adversary paths
+(comments, string / raw-string literals containing fake `#include`s,
+identifiers ending in `R` / `L`).
+
+Per FastLED/fbuild#205 P-03 the aspirational threshold is **≥ 50 MB/s
+single-thread**. This bench captures the baseline; it is not yet a CI
+gate (Phase 7 will wire that up in a follow-up).
+
+Run:
+
+```bash
+uv run soldr cargo bench -p fbuild-header-scan --bench scan_throughput
+```
diff --git a/crates/fbuild-header-scan/benches/scan_throughput.rs b/crates/fbuild-header-scan/benches/scan_throughput.rs
@@ -0,0 +1,59 @@
+//! Criterion benchmark for `fbuild_header_scan::scan` throughput.
+//!
+//! P-03 of FastLED/fbuild#205: capture single-thread MB/s on three input
+//! sizes (tiny / medium / large) so future PRs can be checked for
+//! regressions against a recorded baseline. The aspirational threshold is
+//! ≥ 50 MB/s single-thread; this harness records the number but does not
+//! gate CI.
+
+use criterion::{black_box, criterion_group, criterion_main, Criterion, Throughput};
+use fbuild_header_scan::scan;
+
+/// Build a synthetic C++ source string of at least `target_bytes` bytes.
+///
+/// The result is always a whole number of copies of one fixed template:
+/// copies are appended until the length reaches `target_bytes`, so the
+/// output may overshoot the request by up to one template length, and a
+/// request of `0` yields an empty string. Callers that need the real size
+/// should use the returned string's `len()`.
+///
+/// The template intentionally exercises the scanner's adversary paths:
+/// angled + quoted `#include`, line and multi-line block comments
+/// containing fake `#include`s, string and raw-string literals with
+/// embedded `#include` payloads, identifiers ending in `R` / `L`
+/// (which must NOT be treated as raw-string prefixes), and a char
+/// literal containing `#`.
+fn fixture(target_bytes: usize) -> String {
+    // Each trailing `\` is a string continuation: it drops the line break and
+    // the next source line's leading whitespace, so fixture lines end only at
+    // the explicit `\n` escapes and carry none of this file's indentation.
+    let template = "\
+        #include <a.h>\n\
+        // comment with #include <not_real.h>\n\
+        const char* s = \"#include <also_not_real.h>\";\n\
+        const char* r = R\"(#include <not_real_either.h>)\";\n\
+        auto FooR = 0; // identifier ending in R, NOT a raw string\n\
+        auto FooL = 1; // identifier ending in L, NOT a wide-string prefix\n\
+        /* block\n   #include <inside_block.h>\n*/\n\
+        char c = '#';\n\
+        #include \"b.h\"\n\
+    ";
+    // Reserve room for the final copy that crosses the threshold: the length
+    // is below `target_bytes` before the last push, so it stays within this
+    // capacity and appending never has to grow the buffer.
+    let mut s = String::with_capacity(target_bytes + template.len());
+    while s.len() < target_bytes {
+        s.push_str(template);
+    }
+    s
+}
+
+/// Register the `scan` benchmark group: one case per fixture size.
+///
+/// Each case builds its input once with `fixture`, reports throughput based
+/// on the generated string's actual byte length (which can exceed the
+/// requested size), and times repeated `scan` calls over that input.
+fn bench_scanner(c: &mut Criterion) {
+    let mut group = c.benchmark_group("scan");
+    for (name, size) in [
+        // `fixture` only emits whole template copies, so the "tiny" input is
+        // one full template and therefore longer than the 64 bytes requested.
+        ("tiny", 64usize),
+        ("medium", 100 * 1024),
+        ("large", 2 * 1024 * 1024),
+    ] {
+        // Generated outside the timed closure so fixture construction is not
+        // part of the measurement.
+        let src = fixture(size);
+        // Use the real length, not `size`, so the reported bytes/sec matches
+        // what `scan` actually processed.
+        let actual_len = src.len();
+        group.throughput(Throughput::Bytes(actual_len as u64));
+        group.bench_function(name, |b| {
+            b.iter(|| {
+                // `black_box` on the input keeps the optimizer from
+                // specializing on the fixture; on the output it keeps the
+                // scan result from being discarded as unused.
+                let refs = scan(black_box(&src));
+                black_box(refs);
+            });
+        });
+    }
+    group.finish();
+}
+
+criterion_group!(benches, bench_scanner);
+criterion_main!(benches);
diff --git a/crates/fbuild-library-select/Cargo.toml b/crates/fbuild-library-select/Cargo.toml
@@ -14,3 +14,9 @@ walkdir = { workspace = true }
 
 [dev-dependencies]
 tempfile = { workspace = true }
+criterion = { workspace = true }
+fbuild-test-support = { path = "../fbuild-test-support" }
+
+[[bench]]
+name = "resolve_cold"
+harness = false
diff --git a/crates/fbuild-library-select/benches/README.md b/crates/fbuild-library-select/benches/README.md
@@ -0,0 +1,23 @@
+# fbuild-library-select benches
+
+Criterion benchmarks for the PlatformIO-LDF-style library resolver.
+
+## resolve_cold
+
+End-to-end cold-path measurement of `resolve()` against a synthetic
+~30-library framework tree (Teensyduino-class) built with `MiniFramework`. A
+5-deep transitive include chain forces the two-pass LDF reconciliation; the
+remaining libraries are unreferenced and must be rejected — that doubles as a
+guard against the #204 over-selection regression. Walks the tempdir on every
+iteration since no cache sits in front of `resolve()` today (Phase 4
+memoization waits on zccache#130).
+
+The Phase 7 P-02 threshold from FastLED/fbuild#205 is **≤ 200 ms cold for a
+typical teensy41 project**. This bench only captures the baseline; it is not
+yet a CI gate — gating against the threshold is a follow-up.
+
+Run:
+
+```bash
+uv run soldr cargo bench -p fbuild-library-select --bench resolve_cold
+```
diff --git a/crates/fbuild-library-select/benches/resolve_cold.rs b/crates/fbuild-library-select/benches/resolve_cold.rs