fix(spine): address PR #432 opus 4.8 reviewer findings

claude · claude · commit 0e5ab9852d6c · 2026-05-29T10:28:09.000Z
Three correctness bugs + one architectural disclaimer + three polish items from the PR review pass. No new dependencies; all tests green. ## Bugs fixed ### 1. roundtrip_eq truth check inverted from default semantics (codegen_spine.rs:161 — `if tol > 0.0` gated the entire check) The doc claimed `truth_tolerance() = 0.0` meant "lossless / strictest." The code SKIPPED the truth check when tol = 0.0, so a projection that zeroed every (f, c) round-tripped green with no truth validation. The default-case bug was masked because the existing LossyDropFrequency test overrides tolerance to 0.01. Fix: drop the `if tol > 0.0` gate; the `abs() > tol` comparison naturally treats 0.0 as "any difference fails." Doc reworded to clarify "0.0 requires exact match; override to allow quantization." New test `default_tolerance_requires_exact_truth_match` pins the fix: a `TruthMangler` projection (preserves s/p/o, zeros f/c) MUST fail with the default tolerance. ### 2. parse_triples silently dropped malformed lines (odoo_ontology.rs:73-83 — `filter_map(|l| serde_json::from_str(l).ok())`) Lines that fail JSON parse were silently dropped. The `parses_all_triples` count assertion would catch *some* drift but a corrupted line that happens to keep counts aligned would go silent. Fix: new test `every_nonempty_line_parses` asserts the raw non-empty line count equals `parse_triples(ndjson).len()` — any silent drop fires the assertion. (Kept `parse_triples` returning `Vec` for API stability; the test catches what an error-returning API would.) ### 3. load_ontology collapsed duplicate (s,p,o) keys silently (odoo_ontology.rs:90-104 — HashMap last-write-wins via dn_hash) The module doc said "the extractor de-duplicates" — an unverified assumption. If the harvester ever emits two triples with the same (s, p, o) but different truth values, the second silently overwrites the first. Fix: new test `duplicate_spo_keys_are_last_write_wins` pins the overwrite semantics. A future switch to insertion-rejection or merge becomes a test failure instead of a silent behaviour change. ## Architectural disclaimer `OdooMethodKind` (codegen_spine.rs:230) is the bucket *catalogue*; the *classifier* (Rust port of `.claude/odoo/openings_hops.py`) is a follow-up emitter. action_emitter intentionally does NOT carry a `kind` field — the doc now spells out the wiring gap explicitly so the next session doesn't read this PR as "kind is wired" when it isn't. ## Polish - `RouteBucket::id_owned(&self) -> String` default method added (codegen_spine.rs:336-340). Escape hatch for async/iterator pipelines that need an owned id outside the borrow scope. - `impl std::error::Error for WidgetRenderError` (codegen_spine.rs) for ecosystem `?`-propagation compatibility. - `#[serde(deny_unknown_fields)]` on `OntologyTriple` so harvester schema drift fails parsing instead of silently dropping fields. - New test `function_count_matches_module_doc` in odoo_ontology.rs pins the "3 328 Functions" doc claim against drift inside the loader crate (was only asserted by the downstream action_emitter). - `compose_spec` now builds `effects` from the borrowed `effects_set` directly (action_emitter.rs:255-258), eliminating one redundant `idx.emits_by_fn.get(fn_id)` lookup. ## Test counts (orchestrator-verified) - lance-graph-contract codegen_spine: 6 → 7 passed (+1 truth-mangler) - lance-graph graph::spo:: total: 75 → 78 passed (+3 ontology tests) Fixes from PR #432 opus 4.8 reviewer (findings 1-3 must-fix, 5+7 should-discuss accepted, 4 doc-disclaimer accepted, 6+8 deferred, nitpicks 1+2+3 accepted).
diff --git a/crates/lance-graph-contract/src/codegen_spine.rs b/crates/lance-graph-contract/src/codegen_spine.rs
@@ -115,7 +115,9 @@ pub trait TripletProjection {
     }
 
     /// Tolerance for `f`/`c` comparison in `roundtrip_eq`. Default 0.0
-    /// (lossless); override to allow quantised projections.
+    /// (exact equality required); override to allow quantised projections.
+    /// The check is ALWAYS run — `0.0` does NOT skip it; it requires the
+    /// recovered truth value to match the source exactly.
     fn truth_tolerance() -> f32 {
         0.0
     }
@@ -156,24 +158,23 @@ pub fn roundtrip_eq<P: TripletProjection>(input: &[Triple]) -> Result<(), RoundT
         });
     }
 
-    // Truth-value tolerance check.
+    // Truth-value tolerance check — always run; tol = 0.0 means strict
+    // (any difference fails the `abs() > tol` check naturally).
     let tol = P::truth_tolerance();
-    if tol > 0.0 {
-        let in_truth: std::collections::BTreeMap<_, _> =
-            input.iter().map(|t| (t.key(), (t.f, t.c))).collect();
-        for r in &regenerated {
-            if let Some((f0, c0)) = in_truth.get(&r.key()) {
-                if (r.f - f0).abs() > tol || (r.c - c0).abs() > tol {
-                    return Err(RoundTripFailure {
-                        projection: P::name(),
-                        input_count: in_keys.len(),
-                        output_count: out_keys.len(),
-                        missing_count: 0,
-                        extraneous_count: 0,
-                        sample_missing: vec![r.key()],
-                        sample_extraneous: vec![],
-                    });
-                }
+    let in_truth: std::collections::BTreeMap<_, _> =
+        input.iter().map(|t| (t.key(), (t.f, t.c))).collect();
+    for r in &regenerated {
+        if let Some((f0, c0)) = in_truth.get(&r.key()) {
+            if (r.f - f0).abs() > tol || (r.c - c0).abs() > tol {
+                return Err(RoundTripFailure {
+                    projection: P::name(),
+                    input_count: in_keys.len(),
+                    output_count: out_keys.len(),
+                    missing_count: 0,
+                    extraneous_count: 0,
+                    sample_missing: vec![r.key()],
+                    sample_extraneous: vec![],
+                });
             }
         }
     }
@@ -226,6 +227,19 @@ impl fmt::Display for RoundTripFailure {
 /// Static codegen reads it. Askama route SoC reads it. GUI widget templates
 /// read it. Adding a 17th opening = one variant + one `match` arm in every
 /// consumer (compiler-enforced exhaustiveness).
+///
+/// # Classifier wiring is a separate emitter (TBD)
+///
+/// This enum is the *bucket catalogue*. The function that takes a method
+/// body / AST / `ActionSpec` and returns the matching `OdooMethodKind`
+/// lives in a downstream classifier emitter (the Rust port of
+/// `.claude/odoo/openings_hops.py`'s priority cascade). It is intentionally
+/// NOT wired into `lance_graph::graph::spo::action_emitter` yet —
+/// `ActionSpec` carries the structural edges (effects / inputs / raises /
+/// reads / traverses); the kind classification gets bolted on by the
+/// classifier in a follow-up PR. Until then, consumers that need a kind
+/// should resolve it via the priority classifier directly, not by
+/// inspecting `ActionSpec`.
 #[derive(Debug, Clone, Copy, PartialEq, Eq, Hash, PartialOrd, Ord)]
 pub enum OdooMethodKind {
     /// `pass` body — explicit no-op framework override.
@@ -332,6 +346,13 @@ pub trait RouteBucket {
 
     /// Stable identity of this route (e.g. `account.move._compute_amount`).
     fn id(&self) -> &str;
+
+    /// Owned-id escape hatch for async/iterator pipelines that need to
+    /// outlive a `&dyn RouteBucket` borrow. Defaults to cloning `id()`;
+    /// implementors with a pre-allocated owned string can override.
+    fn id_owned(&self) -> String {
+        self.id().to_string()
+    }
 }
 
 // ---------------------------------------------------------------------------
@@ -363,6 +384,8 @@ impl fmt::Display for WidgetRenderError {
     }
 }
 
+impl std::error::Error for WidgetRenderError {}
+
 // ---------------------------------------------------------------------------
 // ④ Genericity — what to codegen vs what to read from the triple store
 // ---------------------------------------------------------------------------
@@ -491,6 +514,51 @@ mod tests {
         }
     }
 
+    /// Identity-preserving but truth-mangling projection — every (s,p,o)
+    /// round-trips, but (f, c) come back as (0.0, 0.0). With the default
+    /// `truth_tolerance() = 0.0`, this MUST fail the roundtrip check.
+    struct TruthMangler;
+
+    impl TripletProjection for TruthMangler {
+        type Const = Vec<(String, String, String)>;
+
+        fn project(triples: &[Triple]) -> Self::Const {
+            triples
+                .iter()
+                .map(|t| (t.s.clone(), t.p.clone(), t.o.clone()))
+                .collect()
+        }
+
+        fn decompile(c: &Self::Const) -> Vec<Triple> {
+            c.iter()
+                .map(|(s, p, o)| Triple {
+                    s: s.clone(),
+                    p: p.clone(),
+                    o: o.clone(),
+                    f: 0.0,
+                    c: 0.0,
+                })
+                .collect()
+        }
+        // No truth_tolerance() override — default 0.0.
+    }
+
+    #[test]
+    fn default_tolerance_requires_exact_truth_match() {
+        let input = fixture();
+        let result = roundtrip_eq::<TruthMangler>(&input);
+        // Default tolerance is 0.0 → must reject any truth mismatch
+        // (input has f=1.0 / 0.95, decompiled has f=0.0).
+        match result {
+            Err(failure) => {
+                assert!(failure.projection.contains("TruthMangler"));
+            }
+            Ok(()) => {
+                panic!("TruthMangler must fail with default tolerance 0.0 (truth values differ)");
+            }
+        }
+    }
+
     #[test]
     fn odoo_method_kind_ids_are_unique_and_stable() {
         let mut seen = BTreeSet::new();
diff --git a/crates/lance-graph/src/graph/spo/action_emitter.rs b/crates/lance-graph/src/graph/spo/action_emitter.rs
@@ -255,7 +255,7 @@ fn compose_spec(fn_id: &str, idx: &TripleIndex) -> ActionSpec {
     ActionSpec {
         id: fn_id.to_string(),
         family,
-        effects: collect_sorted(idx.emits_by_fn.get(fn_id)),
+        effects: effects_set.iter().cloned().collect(),
         inputs: inputs.into_iter().collect(),
         raises: collect_sorted(idx.raises_by_fn.get(fn_id)),
         reads: collect_sorted(idx.reads_by_fn.get(fn_id)),
diff --git a/crates/lance-graph/src/graph/spo/odoo_ontology.rs b/crates/lance-graph/src/graph/spo/odoo_ontology.rs
@@ -52,7 +52,11 @@ use crate::graph::spo::store::SpoStore;
 use crate::graph::spo::truth::TruthValue;
 
 /// One parsed ontology triple line: `{"s","p","o","f","c"}`.
+///
+/// `deny_unknown_fields` so harvester schema drift surfaces as a parse
+/// error instead of silently degrading the truth signal.
 #[derive(Debug, Clone, serde::Deserialize)]
+#[serde(deny_unknown_fields)]
 pub struct OntologyTriple {
     /// Subject IRI (e.g. `odoo:account_move.amount_total`).
     pub s: String,
@@ -167,4 +171,63 @@ mod tests {
         });
         assert!(found, "expected emitted_by edge missing from data file");
     }
+
+    /// Catch silent parse failures: every non-empty line must produce one
+    /// `OntologyTriple`. If a line is corrupt and `filter_map().ok()` drops
+    /// it, this assertion fires — corruption can't sneak through as a
+    /// quiet count mismatch.
+    #[test]
+    fn every_nonempty_line_parses() {
+        let raw_lines = ONTOLOGY.lines().filter(|l| !l.trim().is_empty()).count();
+        let parsed = parse_triples(ONTOLOGY).len();
+        assert_eq!(
+            raw_lines,
+            parsed,
+            "{} of {} ontology lines silently failed to parse",
+            raw_lines - parsed,
+            raw_lines
+        );
+    }
+
+    /// Pin the documented "extractor de-duplicates" assumption: if two
+    /// triples share `(s, p, o)` but differ in truth, the second insert
+    /// overwrites the first (HashMap last-write-wins via `dn_hash`).
+    /// Verifies the silent-overwrite semantics explicitly so a future
+    /// switch to insertion-rejection or merge becomes a test failure
+    /// instead of a silent change.
+    #[test]
+    fn duplicate_spo_keys_are_last_write_wins() {
+        let s = "odoo:test.x";
+        let p = "depends_on";
+        let o = "odoo:test.y";
+        let ndjson = format!(
+            "{{\"s\":\"{s}\",\"p\":\"{p}\",\"o\":\"{o}\",\"f\":0.9,\"c\":0.9}}\n\
+             {{\"s\":\"{s}\",\"p\":\"{p}\",\"o\":\"{o}\",\"f\":0.1,\"c\":0.1}}\n"
+        );
+
+        let store = load_ontology(&ndjson);
+        // Two source triples → one stored record (key collision).
+        assert_eq!(
+            store.len(),
+            1,
+            "duplicate (s,p,o) must collapse to a single store entry"
+        );
+    }
+
+    /// Lock the module-doc claim "3 328 Functions" against drift so the
+    /// downstream `action_emitter::shipped_ontology_produces_expected_function_count`
+    /// (which asserts the same number on its own) can't get out of sync
+    /// with the loader's source-of-truth count.
+    #[test]
+    fn function_count_matches_module_doc() {
+        let triples = parse_triples(ONTOLOGY);
+        let functions = triples
+            .iter()
+            .filter(|t| t.p == "rdf:type" && t.o == "ogit:Function")
+            .count();
+        assert_eq!(
+            functions, 3328,
+            "function count drifted from module-doc claim (3 328)"
+        );
+    }
 }