You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboardExpand all lines: docs/openapi.json
+28Lines changed: 28 additions & 0 deletions
Original file line number
Diff line number
Diff line change
@@ -13614,6 +13614,34 @@
13614
13614
"type": "array",
13615
13615
"title": "High-level inference providers",
13616
13616
"description": "Unified-mode synthesis input (Decision S5): a high-level, backend-agnostic list of inference providers the synthesizer expands into Llama Stack provider entries. Lives at the configuration root so it survives a future backend change. A non-empty list signals unified mode. Empty (the default) leaves legacy/remote modes unaffected. The sibling default_model / default_provider keep their query-time routing meaning and are independent of this list."
13617
+
},
13618
+
"max_infer_iters": {
13619
+
"anyOf": [
13620
+
{
13621
+
"type": "integer",
13622
+
"exclusiveMinimum": 0.0
13623
+
},
13624
+
{
13625
+
"type": "null"
13626
+
}
13627
+
],
13628
+
"title": "Default max inference iterations",
13629
+
"description": "Server-side default for the maximum number of inference iterations a model can perform in a single request. Prevents small models from looping indefinitely on tool calls. Per-request values take precedence over this default. Set to null to disable the limit.",
13630
+
"default": 10
13631
+
},
13632
+
"max_tool_calls": {
13633
+
"anyOf": [
13634
+
{
13635
+
"type": "integer",
13636
+
"exclusiveMinimum": 0.0
13637
+
},
13638
+
{
13639
+
"type": "null"
13640
+
}
13641
+
],
13642
+
"title": "Default max tool calls",
13643
+
"description": "Server-side default for the maximum number of tool calls allowed in a single response. Prevents small models from exhausting the context window with repeated tool calls. Per-request values take precedence over this default. Set to null to disable the limit.",
0 commit comments