moonbit-community
diff --git a/README.mbt.md b/README.mbt.md
Lines changed: 9 additions & 3 deletions
diff --git a/events.mbt b/events.mbt
Lines changed: 3 additions & 1 deletion
diff --git a/events_test.mbt b/events_test.mbt
Lines changed: 280 additions & 0 deletions
diff --git a/exec.mbt b/exec.mbt
Lines changed: 1 addition & 1 deletion
@@ -3,12 +3,12 @@
 This is the Codex SDK for MoonBit, ported from the TypeScript SDK.
 
 The SDK communicates with Codex by spawning it in non-interactive mode using
-`codex exec`. The target Codex version is 0.79.0.
+`codex exec`. The target Codex version is `codex-cli 0.128.0`.
 
 Codex must be installed and available on your PATH. If not, install with:
 
 ```bash
-pnpm install -g @openai/codex@0.79.0
+pnpm install -g @openai/codex@0.128.0
 ```
 
 ## Usage
@@ -81,7 +81,7 @@ async test {
 
 The MoonBit SDK is a thin but strongly typed wrapper around `codex exec`:
 
-1. `@codex.CodexExec::run` spawns the CLI with `--experimental-json`,
+1. `@codex.CodexExec::run` spawns the CLI with `--json`,
    automatically wiring API endpoint overrides, API keys, sandbox flags, working
    directory overrides, and thread resumption arguments.
 2. The CLI's JSONL stream is fed through `@generator.AsyncGenerator` so the SDK
@@ -91,6 +91,12 @@ The MoonBit SDK is a thin but strongly typed wrapper around `codex exec`:
    hierarchy (`events.mbt` and `items.mbt`), which means MoonBit callers never
    manipulate raw JSON.
 
+The native JSON event parser targets the `codex-cli 0.128.0` non-interactive
+event stream, checked against the upstream `openai/codex` schema at commit
+`2a67c46de498`. In that schema, command execution items always include
+`aggregated_output` as a string; in-progress commands report an empty string
+until terminal output is available.
+
 The `Codex`/`Thread`/`Turn` trio mirrors the CLI lifecycle: a `Codex` holds
 process-level configuration, a `Thread` models a Codex conversation, and a
 `Turn` captures the completed response plus token usage metrics.
 
@@ -126,7 +126,9 @@ pub struct Usage {
   cached_input_tokens : Int
   /// The number of output tokens used during the turn
   output_tokens : Int
-} derive(ToJson, @json.FromJson)
+  /// The number of reasoning output tokens used during the turn
+  reasoning_output_tokens : Int
+} derive(ToJson, @json.FromJson, Debug)
 
 ///|
 pub struct ThreadError {
 
@@ -0,0 +1,280 @@
+///|
+test "parse started command execution with empty output" { // decodes an `item.started` command_execution payload and checks every bound field
+  let event : Event = @json.from_json(
+    @json.parse(
+      (
+        #|{
+        #|  "type": "item.started",
+        #|  "item": {
+        #|    "id": "cmd-1",
+        #|    "type": "command_execution",
+        #|    "command": "pwd",
+        #|    "aggregated_output": "",
+        #|    "status": "in_progress"
+        #|  }
+        #|}
+      ),
+    ),
+  )
+  match event { // the payload above has an empty "aggregated_output" and no "exit_code" key
+    ItemStarted(
+      CommandExecutionItem(
+        id~,
+        command~,
+        aggregated_output~,
+        exit_code~,
+        status~
+      )
+    ) => {
+      debug_inspect(
+        id,
+        content=(
+          #|"cmd-1"
+        ),
+      )
+      debug_inspect(
+        command,
+        content=(
+          #|"pwd"
+        ),
+      )
+      debug_inspect(
+        aggregated_output,
+        content=(
+          #|""
+        ),
+      )
+      debug_inspect(exit_code, content="None") // the absent "exit_code" key must surface as None
+      guard status is InProgress else { // "in_progress" must decode to InProgress
+        fail("expected in-progress command execution")
+      }
+    }
+    _ => fail("expected started command execution") // any other event or item variant fails the test
+  }
+}
+
+///|
+test "parse declined command execution" { // decodes an `item.completed` command_execution whose status is "declined"
+  let event : Event = @json.from_json(
+    @json.parse(
+      (
+        #|{
+        #|  "type": "item.completed",
+        #|  "item": {
+        #|    "id": "cmd-1",
+        #|    "type": "command_execution",
+        #|    "command": "pwd",
+        #|    "aggregated_output": "",
+        #|    "status": "declined"
+        #|  }
+        #|}
+      ),
+    ),
+  )
+  match event { // only status and exit_code are bound; the remaining fields are ignored via `..`
+    ItemCompleted(CommandExecutionItem(status~, exit_code~, ..)) => {
+      guard status is Declined else { // "declined" must decode to Declined
+        fail("expected declined command execution")
+      }
+      debug_inspect(exit_code, content="None") // the payload carries no "exit_code" key
+    }
+    _ => fail("expected completed command execution") // any other event or item variant fails the test
+  }
+}
+
+///|
+test "parse completed collab tool call" { // decodes an `item.completed` collab_tool_call payload for the "spawn_agent" tool
+  let event : Event = @json.from_json(
+    @json.parse(
+      (
+        #|{
+        #|  "type": "item.completed",
+        #|  "item": {
+        #|    "id": "collab-1",
+        #|    "type": "collab_tool_call",
+        #|    "tool": "spawn_agent",
+        #|    "sender_thread_id": "thread-parent",
+        #|    "receiver_thread_ids": ["thread-child"],
+        #|    "prompt": "draft a plan",
+        #|    "agents_states": {
+        #|      "thread-child": {
+        #|        "status": "running",
+        #|        "message": null
+        #|      }
+        #|    },
+        #|    "status": "completed"
+        #|  }
+        #|}
+      ),
+    ),
+  )
+  match event { // the payload's "agents_states" object is parsed but never inspected below
+    ItemCompleted(
+      CollabToolCallItem(
+        tool~,
+        sender_thread_id~,
+        receiver_thread_ids~,
+        prompt~,
+        status~,
+        .. // remaining fields are not asserted by this test
+      )
+    ) => {
+      guard tool is SpawnAgent else { fail("expected spawn_agent collab tool") } // "spawn_agent" must decode to SpawnAgent
+      guard status is Completed else { // "completed" must decode to Completed
+        fail("expected completed collab tool call")
+      }
+      debug_inspect(
+        sender_thread_id,
+        content=(
+          #|"thread-parent"
+        ),
+      )
+      debug_inspect(
+        receiver_thread_ids,
+        content=(
+          #|["thread-child"]
+        ),
+      )
+      debug_inspect( // the expected snapshot below shows prompt wrapped in Some(...)
+        prompt,
+        content=(
+          #|Some("draft a plan")
+        ),
+      )
+    }
+    _ => fail("expected completed collab tool call") // any other event or item variant fails the test
+  }
+}
+
+///|
+test "parse in-progress file change" { // decodes an `item.started` file_change payload with status "in_progress"
+  let event : Event = @json.from_json(
+    @json.parse(
+      (
+        #|{
+        #|  "type": "item.started",
+        #|  "item": {
+        #|    "id": "patch-1",
+        #|    "type": "file_change",
+        #|    "changes": [
+        #|      { "path": "README.md", "kind": "update" }
+        #|    ],
+        #|    "status": "in_progress"
+        #|  }
+        #|}
+      ),
+    ),
+  )
+  match event { // only status and changes are bound; the remaining fields are ignored via `..`
+    ItemStarted(FileChangeItem(status~, changes~, ..)) => {
+      guard status is InProgress else { // "in_progress" must decode to InProgress
+        fail("expected in-progress file change")
+      }
+      debug_inspect( // checks only the number of changes, not each entry's path or kind
+        changes.length(),
+        content=(
+          #|1
+        ),
+      )
+    }
+    _ => fail("expected started file change") // any other event or item variant fails the test
+  }
+}
+
+///|
+test "parse in-progress mcp tool call with null result and error" { // decodes an `item.started` mcp_tool_call whose "result" and "error" are both null
+  let event : Event = @json.from_json(
+    @json.parse(
+      (
+        #|{
+        #|  "type": "item.started",
+        #|  "item": {
+        #|    "id": "mcp-1",
+        #|    "type": "mcp_tool_call",
+        #|    "server": "docs",
+        #|    "tool": "search",
+        #|    "arguments": { "query": "codex" },
+        #|    "result": null,
+        #|    "error": null,
+        #|    "status": "in_progress"
+        #|  }
+        #|}
+      ),
+    ),
+  )
+  match event { // only result and status are bound; server, tool and arguments are not asserted
+    ItemStarted(McpToolCallItem(result~, status~, ..)) => {
+      guard status is InProgress else { // "in_progress" must decode to InProgress
+        fail("expected in-progress MCP tool call")
+      }
+      guard result is None else { fail("expected no MCP result") } // null "result" and null "error" are expected to yield None
+    }
+    _ => fail("expected started MCP tool call") // any other event or item variant fails the test
+  }
+}
+
+///|
+test "parse turn completed usage with reasoning tokens" { // decodes a `turn.completed` event whose usage includes "reasoning_output_tokens"
+  let event : Event = @json.from_json(
+    @json.parse(
+      (
+        #|{
+        #|  "type": "turn.completed",
+        #|  "usage": {
+        #|    "input_tokens": 10,
+        #|    "cached_input_tokens": 3,
+        #|    "output_tokens": 7,
+        #|    "reasoning_output_tokens": 5
+        #|  }
+        #|}
+      ),
+    ),
+  )
+  match event { // the expected snapshot below lists all four token counters from the payload
+    TurnCompleted(usage) =>
+      debug_inspect( // compares the debug rendering of the whole usage value against the snapshot
+        usage,
+        content=(
+          #|{
+          #|  input_tokens: 10,
+          #|  cached_input_tokens: 3,
+          #|  output_tokens: 7,
+          #|  reasoning_output_tokens: 5,
+          #|}
+        ),
+      )
+    _ => fail("expected turn completed event") // any other event variant fails the test
+  }
+}
+
+///|
+test "parse failed mcp tool call with null result" { // decodes an `item.completed` mcp_tool_call with a null "result" and a populated "error"
+  let event : Event = @json.from_json(
+    @json.parse(
+      (
+        #|{
+        #|  "type": "item.completed",
+        #|  "item": {
+        #|    "id": "mcp-1",
+        #|    "type": "mcp_tool_call",
+        #|    "server": "docs",
+        #|    "tool": "search",
+        #|    "arguments": { "query": "codex" },
+        #|    "result": null,
+        #|    "error": { "message": "permission denied" },
+        #|    "status": "failed"
+        #|  }
+        #|}
+      ),
+    ),
+  )
+  match event { // only result and status are bound; server, tool and arguments are not asserted
+    ItemCompleted(McpToolCallItem(result~, status~, ..)) => {
+      guard status is Failed else { fail("expected failed MCP tool call") } // "failed" must decode to Failed
+      guard result is Some(Err("permission denied")) else { // the "error.message" text is expected inside Some(Err(...))
+        fail("expected MCP error result")
+      }
+    }
+    _ => fail("expected completed MCP tool call") // any other event or item variant fails the test
+  }
+}
@@ -68,7 +68,7 @@ async fn[T] CodexExec::run(
   taskgroup : @async.TaskGroup[T],
 ) -> @generator.AsyncGenerator[String] {
   // Build command arguments
-  let command_args : Array[String] = ["exec", "--experimental-json"]
+  let command_args : Array[String] = ["exec", "--json"]
 
   // Add optional arguments
   if args.thread_options.model is Some(model) {