bernardladenthin
diff --git a/spotbugs-exclude.xml b/spotbugs-exclude.xml
Lines changed: 14 additions & 0 deletions
diff --git a/src/main/java/net/ladenthin/llama/ChatMessage.java b/src/main/java/net/ladenthin/llama/ChatMessage.java
Lines changed: 1 addition & 1 deletion
diff --git a/src/main/java/net/ladenthin/llama/ChatRequest.java b/src/main/java/net/ladenthin/llama/ChatRequest.java
Lines changed: 19 additions & 15 deletions
diff --git a/src/main/java/net/ladenthin/llama/CompletionResult.java b/src/main/java/net/ladenthin/llama/CompletionResult.java
Lines changed: 1 addition & 1 deletion
@@ -88,6 +88,20 @@ SPDX-License-Identifier: MIT
         </Or>
     </Match>
 
+    <!--
+        Same design-intent rationale as the ModelParameters OCP block above:
+        InferenceParameters.withReasoningFormat(ReasoningFormat) intentionally
+        types its parameter to the specific ReasoningFormat enum rather than
+        the shared CliArg interface. The narrow type is the API contract;
+        widening it would silently accept any CliArg-implementing enum and
+        emit a nonsense JSON value the native code would reject.
+    -->
+    <Match>
+        <Class name="net.ladenthin.llama.InferenceParameters"/>
+        <Bug pattern="OCP_OVERLY_CONCRETE_PARAMETER"/>
+        <Method name="withReasoningFormat"/>
+    </Match>
+
     <!--
         InferenceParameters and ModelParameters are fluent builders whose
         parameters field is a Map<String, String> serving as the CLI / JSON
 
@@ -25,7 +25,7 @@
  * Multimodal turns carry a non-null {@link #getParts()} list of {@link ContentPart}s
  * (text and image references). When parts are present they take precedence over
  * {@link #getContent()} during serialization; the upstream OAI chat path
- * (see {@link InferenceParameters#setMessages(java.util.List)}) emits an array-form
+ * (see {@link InferenceParameters#withMessages(java.util.List)}) emits an array-form
  * {@code content} field that the compiled-in {@code mtmd} pipeline understands.
  * </p>
  *
 
@@ -12,7 +12,7 @@
 import java.util.Collections;
 import java.util.List;
 import java.util.Optional;
-import java.util.function.Consumer;
+import java.util.function.UnaryOperator;
 import lombok.EqualsAndHashCode;
 import lombok.ToString;
 import org.jspecify.annotations.Nullable;
@@ -25,8 +25,12 @@
  *
  * <p>The request carries the conversation messages, optional tool definitions,
  * an optional {@code tool_choice} hint, and an {@link InferenceParameters}
- * customiser applied to the underlying request just before invocation. The
- * type is consumed by {@link LlamaModel#chat(ChatRequest)} and
+ * customiser applied to the underlying request just before invocation. Because
+ * {@link InferenceParameters} is itself immutable, the customiser is a
+ * {@link UnaryOperator} that takes a parameter set and returns the transformed
+ * one — callers chain {@code withX(...)} calls on the input and return the
+ * resulting instance. The type is consumed by
+ * {@link LlamaModel#chat(ChatRequest)} and
  * {@link LlamaModel#chatWithTools(ChatRequest, java.util.Map)}.
  *
  * <p>All instances are <b>immutable</b>: every field is {@code final} and the
@@ -47,7 +51,7 @@
  *         .appendMessage("system", "be terse")
  *         .appendMessage("user", "two plus two?")
  *         .withMaxToolRounds(2)
- *         .withInferenceCustomizer(p -> p.setNPredict(8).setSeed(1));
+ *         .withInferenceCustomizer(p -> p.withNPredict(8).withSeed(1));
  * }</pre>
  *
  * <p>Each call allocates a new {@code ChatRequest}. The cost is intentional:
@@ -58,7 +62,7 @@
  *
  * <p>{@code @EqualsAndHashCode} compares messages, tools, {@code toolChoice},
  * and {@code maxToolRounds} by value. The {@code paramsCustomizer}
- * {@link Consumer} is <b>excluded</b> from equality: lambdas have
+ * {@link UnaryOperator} is <b>excluded</b> from equality: lambdas have
  * compiler-synthesised identity equality which is not value-shaped, so
  * including it would mean two structurally-identical requests with the same
  * customiser source code rarely compare equal — surprising for the typical
@@ -93,7 +97,7 @@ public final class ChatRequest {
     // equality is compiler-synthesised class identity, not value-shaped.
     @ToString.Exclude
     @EqualsAndHashCode.Exclude
-    private final @Nullable Consumer<InferenceParameters> paramsCustomizer;
+    private final @Nullable UnaryOperator<InferenceParameters> paramsCustomizer;
 
     /**
      * All-args constructor. Private because callers should enter via {@link #empty()}
@@ -105,7 +109,7 @@ private ChatRequest(
             List<ToolDefinition> tools,
             @Nullable String toolChoice,
             int maxToolRounds,
-            @Nullable Consumer<InferenceParameters> paramsCustomizer) {
+            @Nullable UnaryOperator<InferenceParameters> paramsCustomizer) {
         this.messages = messages;
         this.tools = tools;
         this.toolChoice = toolChoice;
@@ -212,7 +216,7 @@ public ChatRequest withMaxToolRounds(int newMaxToolRounds) {
      * @param newCustomizer the customiser; {@code null} clears any prior customiser
      * @return a new request with the customiser replaced; this request is unchanged
      */
-    public ChatRequest withInferenceCustomizer(@Nullable Consumer<InferenceParameters> newCustomizer) {
+    public ChatRequest withInferenceCustomizer(@Nullable UnaryOperator<InferenceParameters> newCustomizer) {
         return new ChatRequest(messages, tools, toolChoice, maxToolRounds, newCustomizer);
     }
 
@@ -319,14 +323,14 @@ public Optional<String> buildToolsJson() {
     }
 
     /**
-     * Apply the optional customiser to an {@link InferenceParameters} instance.
-     * Package-private; called by {@link LlamaModel}.
+     * Apply the optional customiser to an {@link InferenceParameters} instance and
+     * return the transformed result. Package-private; called by {@link LlamaModel}.
+     * When no customiser is set, returns {@code params} unchanged.
      *
-     * @param params the parameters to mutate
+     * @param params the parameters to transform
+     * @return the (possibly new) parameters produced by the customiser, or {@code params} when no customiser is set
      */
-    void applyCustomizer(InferenceParameters params) {
-        if (paramsCustomizer != null) {
-            paramsCustomizer.accept(params);
-        }
+    InferenceParameters applyCustomizer(InferenceParameters params) {
+        return paramsCustomizer == null ? params : paramsCustomizer.apply(params);
     }
 }
@@ -13,7 +13,7 @@
  * <p>
  * Bundles the generated text with parsed {@link Usage}, {@link Timings},
  * per-token {@link TokenLogprob} entries (populated only when
- * {@link InferenceParameters#setNProbs(int)} &gt; 0), and the {@link StopReason}.
+ * {@link InferenceParameters#withNProbs(int)} &gt; 0), and the {@link StopReason}.
  * The raw native JSON is exposed via {@link #getRawJson()} as an escape hatch.
  * </p>
  *
Original file line number	Diff line number	Diff line change
`@@ -25,7 +25,7 @@`
`25`	`25`	`* Multimodal turns carry a non-null {@link #getParts()} list of {@link ContentPart}s`
`26`	`26`	`* (text and image references). When parts are present they take precedence over`
`27`	`27`	`* {@link #getContent()} during serialization; the upstream OAI chat path`
`28`		`- * (see {@link InferenceParameters#setMessages(java.util.List)}) emits an array-form`
	`28`	`+ * (see {@link InferenceParameters#withMessages(java.util.List)}) emits an array-form`
`29`	`29`	`* {@code content} field that the compiled-in {@code mtmd} pipeline understands.`
`30`	`30`	`* </p>`
`31`	`31`	`*`
Original file line number	Diff line number	Diff line change
`@@ -13,7 +13,7 @@`
`13`	`13`	`* <p>`
`14`	`14`	`* Bundles the generated text with parsed {@link Usage}, {@link Timings},`
`15`	`15`	`* per-token {@link TokenLogprob} entries (populated only when`
`16`		`- * {@link InferenceParameters#setNProbs(int)} &gt; 0), and the {@link StopReason}.`
	`16`	`+ * {@link InferenceParameters#withNProbs(int)} &gt; 0), and the {@link StopReason}.`
`17`	`17`	`* The raw native JSON is exposed via {@link #getRawJson()} as an escape hatch.`
`18`	`18`	`* </p>`
`19`	`19`	`*`