Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 6 additions & 2 deletions packages/llm/src/protocols/openai-chat.ts
Original file line number Diff line number Diff line change
Expand Up @@ -145,6 +145,10 @@ type OpenAIChatToolCallDelta = Schema.Schema.Type<typeof OpenAIChatToolCallDelta
const OpenAIChatDelta = Schema.Struct({
content: optionalNull(Schema.String),
reasoning_content: optionalNull(Schema.String),
// Some OpenAI-compatible providers (Scaleway, vLLM/SGLang, OpenRouter, ...)
// stream reasoning under `reasoning` rather than `reasoning_content`. Accept
// both so their thinking is not silently dropped.
reasoning: optionalNull(Schema.String),
tool_calls: optionalNull(Schema.Array(OpenAIChatToolCallDelta)),
})

Expand Down Expand Up @@ -416,8 +420,8 @@ const step = (state: ParserState, event: OpenAIChatEvent) =>

let lifecycle = state.lifecycle

if (delta?.reasoning_content)
lifecycle = Lifecycle.reasoningDelta(lifecycle, events, "reasoning-0", delta.reasoning_content)
const reasoningText = delta?.reasoning_content ?? delta?.reasoning
if (reasoningText) lifecycle = Lifecycle.reasoningDelta(lifecycle, events, "reasoning-0", reasoningText)

if (delta?.content) {
lifecycle = Lifecycle.reasoningEnd(lifecycle, events, "reasoning-0")
Expand Down
41 changes: 41 additions & 0 deletions packages/llm/test/provider/openai-chat.test.ts
Original file line number Diff line number Diff line change
Expand Up @@ -552,6 +552,47 @@ describe("OpenAI Chat route", () => {
}),
)

it.effect("parses OpenAI-compatible reasoning deltas from the `reasoning` field", () =>
Effect.gen(function* () {
const body = sseEvents(
{ choices: [{ delta: { reasoning: "thinking" } }] },
{ choices: [{ delta: { content: "Hello" } }] },
{ choices: [{ delta: {}, finish_reason: "stop" }] },
)

const response = yield* LLMClient.generate(request).pipe(Effect.provide(fixedResponse(body)))

expect(response.reasoning).toBe("thinking")
expect(response.text).toBe("Hello")
expect(response.events).toMatchObject([
{ type: "step-start", index: 0 },
{ type: "reasoning-start", id: "reasoning-0" },
{ type: "reasoning-delta", id: "reasoning-0", text: "thinking" },
{ type: "reasoning-end", id: "reasoning-0" },
{ type: "text-start", id: "text-0" },
{ type: "text-delta", id: "text-0", text: "Hello" },
{ type: "text-end", id: "text-0" },
{ type: "step-finish", index: 0, reason: "stop" },
{ type: "finish", reason: "stop" },
])
}),
)

it.effect("prefers reasoning_content when both reasoning fields are present", () =>
Effect.gen(function* () {
const body = sseEvents(
{ choices: [{ delta: { reasoning_content: "canonical", reasoning: "duplicate" } }] },
{ choices: [{ delta: { content: "Hello" } }] },
{ choices: [{ delta: {}, finish_reason: "stop" }] },
)

const response = yield* LLMClient.generate(request).pipe(Effect.provide(fixedResponse(body)))

expect(response.reasoning).toBe("canonical")
expect(response.text).toBe("Hello")
}),
)

it.effect("assembles streamed tool call input", () =>
Effect.gen(function* () {
const body = sseEvents(
Expand Down
Loading