gitbutlerapp
diff --git a/apps/web/src/routes/cli/scripts.json b/apps/web/src/routes/cli/scripts.json
Lines changed: 4 additions & 4 deletions
diff --git a/crates/but-agentlog/skill/SKILL.md b/crates/but-agentlog/skill/SKILL.md
Lines changed: 5 additions & 5 deletions
diff --git a/crates/but-agentlog/skill/agents/openai.yaml b/crates/but-agentlog/skill/agents/openai.yaml
Lines changed: 1 addition & 1 deletion
diff --git a/crates/but-agentlog/src/cli.rs b/crates/but-agentlog/src/cli.rs
Lines changed: 1 addition & 1 deletion
diff --git a/crates/but-agentlog/src/skim.rs b/crates/but-agentlog/src/skim.rs
Lines changed: 7 additions & 5 deletions
diff --git a/crates/but/skill/RESEARCH.md b/crates/but/skill/RESEARCH.md
Lines changed: 25 additions & 25 deletions
diff --git a/crates/but/skill/references/reference.md b/crates/but/skill/references/reference.md
Lines changed: 1 addition & 1 deletion
diff --git a/crates/but/src/args/mod.rs b/crates/but/src/args/mod.rs
Lines changed: 25 additions & 18 deletions
diff --git a/crates/but/src/args/tests.rs b/crates/but/src/args/tests.rs
Lines changed: 3 additions & 2 deletions
diff --git a/crates/but/src/args/tests/reword.rs b/crates/but/src/args/tests/reword.rs
Lines changed: 12 additions & 0 deletions
@@ -230,11 +230,11 @@
 		"script": [
 			{
 				"type": "input",
-				"lines": ["# Everything takes --json"]
+				"lines": ["# Everything takes --format json"]
 			},
 			{
 				"type": "input",
-				"lines": ["$ but --json branch new feature/ai-integration | jq ."]
+				"lines": ["$ but --format json branch new feature/ai-integration | jq ."]
 			},
 			{
 				"type": "output",
@@ -247,7 +247,7 @@
 			},
 			{
 				"type": "input",
-				"lines": ["$ but show -j 90fe | jq ."]
+				"lines": ["$ but show --format json 90fe | jq ."]
 			},
 			{
 				"type": "output",
@@ -265,7 +265,7 @@
 			},
 			{
 				"type": "input",
-				"lines": ["$ but --json status | jq '.stacks[].branches[].commits[]'"]
+				"lines": ["$ but --format json status | jq '.stacks[].branches[].commits[]'"]
 			},
 			{
 				"type": "output",
 
@@ -54,7 +54,7 @@ Pass an explicit target only when the user gives one.
 Use JSON only when you need exact handles for drill-down:
 
 ```sh
-but --json agentlog skim
+but --format json agentlog skim
 ```
 
 1. Start with `skim` for a clean orientation.
@@ -63,8 +63,8 @@ but --json agentlog skim
 3. If `skim` is enough for a lightweight status answer, summarize it and stop.
 4. Drill down only when `skim` is ambiguous, misses the rationale, or you need
    exact evidence.
-5. To drill down, rerun `skim` with `--json` to get the relevant `session_key`
-   and `turn_key`, then use `show`.
+5. To drill down, rerun `skim` with `--format json` to get the relevant
+   `session_key` and `turn_key`, then use `show`.
 6. Use `show <session-key>` for turn-level context.
 7. Use `show <session-key> --turn <turn-key>` only for turns that need exact detail.
 
@@ -91,8 +91,8 @@ Do not use plain Git's `gitbutler/workspace` branch as an agentlog target.
 - Prefer `skim` for turn-history recovery.
 - Treat `skim` as complete but abbreviated. It includes every related session
   and every turn in those sessions, not every record or the full transcript.
-- Prefer human `skim` output first. Use `--json` only for drill-down handles
-  or exact evidence.
+- Prefer human `skim` output first. Use `--format json` only for drill-down
+  handles or exact evidence.
 - Run `show` when `skim` is thin, ambiguous, missing the why, or when the user
   is asking you to make or verify a consequential claim.
 - Do not dump records for every candidate session.
 
@@ -1,4 +1,4 @@
 interface:
   display_name: "But Agentlog"
   short_description: "Get context for a GitButler branch from prior agent work"
-  default_prompt: "Use $but-agentlog for requests like \"get context for branch\", \"catch up on this branch\", or \"recover branch context\". Do not start with generic git branch/diff inspection; run `but agentlog skim` first. Use `but --json agentlog skim` plus `but agentlog show` only if exact drill-down is needed."
+  default_prompt: "Use $but-agentlog for requests like \"get context for branch\", \"catch up on this branch\", or \"recover branch context\". Do not start with generic git branch/diff inspection; run `but agentlog skim` first. Use `but --format json agentlog skim` plus `but agentlog show` only if exact drill-down is needed."
@@ -33,7 +33,7 @@ pub enum Command {
     /// Show a session, or one turn in detail.
     #[clap(name = "show")]
     Show {
-        /// Session key from `skim --json`.
+        /// Session key from `skim --format json`.
         #[clap(value_name = "SESSION", value_parser = non_empty_value)]
         session_key: String,
         /// Show detailed records for this turn key.
 
@@ -346,16 +346,18 @@ fn applied_gitbutler_branch(workdir: &Path) -> anyhow::Result<String> {
     let output = ProcessCommand::new(&but_path)
         .arg("-C")
         .arg(workdir)
-        .args(["--json", "status"])
+        .args(["--format", "json", "status"])
         .stdin(Stdio::null())
         .output()
-        .context("failed to run 'but --json status' for agentlog skim target discovery")?;
+        .context("failed to run 'but --format json status' for agentlog skim target discovery")?;
     if !output.status.success() {
         let stderr = String::from_utf8_lossy(&output.stderr);
-        anyhow::bail!("failed to discover GitButler branch with 'but --json status': {stderr}");
+        anyhow::bail!(
+            "failed to discover GitButler branch with 'but --format json status': {stderr}"
+        );
     }
-    let status: StatusReport =
-        serde_json::from_slice(&output.stdout).context("failed to parse 'but --json status'")?;
+    let status: StatusReport = serde_json::from_slice(&output.stdout)
+        .context("failed to parse 'but --format json status'")?;
     status
         .stacks
         .into_iter()
 
@@ -52,9 +52,9 @@ Evaluation structure they suggest:
   "query": "Commit the auth changes to the feature branch",
   "files": ["src/auth.rs"],
   "expected_behavior": [
-    "Runs but status --json to check workspace state",
+    "Runs but status --format json to check workspace state",
     "Uses but commit with --changes flag for specific files",
-    "Includes --json and --status-after flags"
+    "Includes --format json and --status-after flags"
   ]
 }
 ```
@@ -101,7 +101,7 @@ tests:
       - type: javascript
         value: |
           const text = String(output).toLowerCase();
-          return text.includes('--json') && text.includes('--status-after');
+          return text.includes('--format json') && text.includes('--status-after');
 ```
 
 ## Metrics That Matter
@@ -113,10 +113,10 @@ Based on industry standards and our specific skill file, here are the metrics to
 | Metric | What It Measures | Target | How to Score |
 |--------|-----------------|--------|-------------|
 | **Tool routing accuracy** | Uses `but` instead of `git` for write ops | 100% | Binary per command |
-| **`--json` compliance** | All `but` commands include `--json` | 100% | Count across all commands in response |
+| **`--format json` compliance** | All `but` commands include `--format json` | 100% | Count across all commands in response |
 | **`--status-after` compliance** | Mutation commands include `--status-after` | 100% | Check commit/absorb/rub/stage/squash/move/uncommit |
 | **`--changes` specificity** | `but commit` uses `--changes` with explicit IDs (`a1,b2` or repeated flag), not bare commit | >90% | Binary per commit command |
-| **Workflow ordering** | Runs `but status --json` before mutations | 100% | Check command sequence |
+| **Workflow ordering** | Runs `but status --format json` before mutations | 100% | Check command sequence |
 | **Unnecessary round-trips** | No `but status` after commands with `--status-after` | 0 | Count redundant status calls |
 | **Task completion** | End-to-end task succeeds | >80% | Binary per scenario |
 
@@ -149,7 +149,7 @@ Validate skill file structure without calling any LLM. Run as part of `cargo tes
 **What to check:**
 - YAML frontmatter is valid and meets Anthropic's constraints (name <=64 chars, description <=1024 chars)
 - All referenced files exist (`references/reference.md`, etc.)
-- Code examples are internally consistent (every mutation command example includes `--json --status-after`)
+- Code examples are internally consistent (every mutation command example includes `--format json --status-after`)
 - No contradictions between SKILL.md and reference files
 - Translation table covers all commands mentioned in reference.md
 - Line count stays under 250 (our budget)
@@ -171,13 +171,13 @@ Score: Does the tool call match expectations?
 
 | User Prompt | Expected First Command | Assertions |
 |------------|----------------------|------------|
-| "What files have I changed?" | `but status --json` | contains `but status`, contains `--json` |
-| "Commit my auth changes" | `but status --json` | status first, then commit with `--changes` |
+| "What files have I changed?" | `but status --format json` | contains `but status`, contains `--format json` |
+| "Commit my auth changes" | `but status --format json` | status first, then commit with `--changes` |
 | "Create a new branch for auth" | `but branch new auth` | contains `but branch new` |
 | "Push my changes" | `but push` | NOT `git push` |
 | "Squash my last 3 commits" | `but squash` | NOT `git rebase -i` |
 | "Can you do a git push?" | `but push` | uses `but` not `git` |
-| "Check what's changed" | `but status --json` | NOT `git status`, NOT `git diff` |
+| "Check what's changed" | `but status --format json` | NOT `git status`, NOT `git diff` |
 | "Undo my last commit" | some `but` command | NOT `git reset` |
 
 **Implementation options:**
@@ -206,23 +206,23 @@ Test complete workflows with mock tool execution. This is the highest-signal tie
 ```
 User: "I just finished implementing auth. Commit it."
 Expected sequence:
-  1. but status --json           (check state)
-  2. but commit <branch> -m "..." --changes <id>,<id> --json --status-after  (commit)
+  1. but status --format json           (check state)
+  2. but commit <branch> -m "..." --changes <id>,<id> --format json --status-after  (commit)
 Assertions:
   - Step 1 happens before step 2
   - Commit includes --changes (not bare commit)
-  - Commit includes --json --status-after
+  - Commit includes --format json --status-after
   - No git commands used
 ```
 
 **Scenario: New feature workflow**
 ```
 User: "Add a dark mode feature"
 Expected sequence:
-  1. but status --json           (check state)
+  1. but status --format json           (check state)
   2. but branch new dark-mode    (create branch)
   3. [file edits happen]
-  4. but commit ... --changes ... --json --status-after
+  4. but commit ... --changes ... --format json --status-after
 Assertions:
   - Branch created before any commits
   - Commit targets the new branch
@@ -243,7 +243,7 @@ The key insight from the research: you don't need to run real commands. Mock the
 
 ```python
 def mock_bash(command: str) -> str:
-    if "but status --json" in command:
+    if "but status --format json" in command:
         return json.dumps({
             "unassignedChanges": [
                 {"cliId": "a1", "filePath": "src/auth.rs", "changeType": "modified"}
@@ -261,20 +261,20 @@ This gives full control, deterministic scoring, and low cost (can use Sonnet/Hai
 
 #### Tier 3 Implementation Notes
 
-**Key insight: Tier 3 tests the skill file, not the `but` CLI.** No `but` binary runs. No git repo exists. The mock handlers return canned JSON that looks like `but status --json` output. You're measuring whether SKILL.md *teaches the model correctly* — complementary to Tier 1's structural validation.
+**Key insight: Tier 3 tests the skill file, not the `but` CLI.** No `but` binary runs. No git repo exists. The mock handlers return canned JSON that looks like `but status --format json` output. You're measuring whether SKILL.md *teaches the model correctly* — complementary to Tier 1's structural validation.
 
 ```
                     ┌─────────────┐
   SKILL.md ───────► │  LLM (API)  │ ◄──── user prompt
   (system context)  └──────┬──────┘
                            │
-                      tool_use: "but status --json"
+                      tool_use: "but status --format json"
                            │
                     ┌──────▼──────┐
                     │ Mock handler │ ──► canned JSON
                     └──────┬──────┘
                            │
-                      tool_use: "but commit ... --changes a1 --json --status-after"
+                      tool_use: "but commit ... --changes a1 --format json --status-after"
                            │
                     Score: did the command sequence follow SKILL.md rules?
 ```
@@ -285,13 +285,13 @@ Tier 3 remains useful for cheap, deterministic diagnostics, but this project gat
 
 | # | Scenario | Key assertions |
 |---|----------|----------------|
-| 1 | Basic commit flow | `status --json` before `commit`; commit has `--changes`, `--json`, `--status-after`; no git write commands |
+| 1 | Basic commit flow | `status --format json` before `commit`; commit has `--changes`, `--format json`, `--status-after`; no git write commands |
 | 2 | Branch workflow | Create branch (`but branch new` or `but commit <branch> -c`) before committing |
 | 3 | Git synonym redirect | User says "git push", model uses `but push` and not `git push` |
-| 4 | Ordering flow | `but status --json` occurs before `but commit` |
+| 4 | Ordering flow | `but status --format json` occurs before `but commit` |
 | 5 | Specificity flow | Single-file commit uses `--changes`; non-target file remains unassigned in repo state |
-| 6 | Amend flow | Use `but amend` with `--json --status-after`; no git write fallback |
-| 7 | Reorder flow | Use `but move`/`but rub` with `--json --status-after`; no `git rebase`/checkout fallback; repo reflects target order |
+| 6 | Amend flow | Use `but amend` with `--format json --status-after`; no git write fallback |
+| 7 | Reorder flow | Use `but move`/`but rub` with `--format json --status-after`; no `git rebase`/checkout fallback; repo reflects target order |
 
 ### Tier 4: Integration (High-cost, realistic)
 
@@ -304,7 +304,7 @@ Run Claude Code against a real test repository with the latest `but` binary and
 | Runs `but` binary | No | Yes — freshly built from source |
 | Real git repo | No | Yes — disposable fixture |
 | Command trace | From mock loop | From SDK hooks or output parsing |
-| Asserts on repo state | No | Yes — `but status --json` after |
+| Asserts on repo state | No | Yes — `but status --format json` after |
 | Cost per scenario | ~$0.02 | ~$0.10-0.50 |
 | Speed | ~5 sec | ~30-120 sec |
 | Catches real bugs | Skill file only | Skill + CLI interaction |
@@ -361,7 +361,7 @@ Running the real Tier 4 harness surfaced a few practical issues that are not obv
    - Fix: normalize fixture path with `pwd -P` in `setup-fixture.sh`.
 
 4. **Keep fixture support files out of Git status.**
-   - `.but-data/` and installed `.claude/skills/` content polluted `but status --json` and changed CLI IDs.
+   - `.but-data/` and installed `.claude/skills/` content polluted `but status --format json` and changed CLI IDs.
    - Fix: add `.but-data/`, `.claude/`, `.tmp/` to `.git/info/exclude` in each fixture.
 
 5. **Fixture cleanup should be best-effort.**
@@ -398,7 +398,7 @@ For **Tier 3** (mock tool execution), Rust is viable since it just calls the Ant
 1. **Keep Tier 4 as the default evaluator** for skill changes.
 2. **Treat a 7-scenario Tier 4 smoke run (`--repeat 1`) as the PR gate** for changes under `crates/but/skill/`.
 3. **Run repeated Tier 4 (`--repeat 3+`) nightly or pre-release** to catch stochastic regressions.
-4. **Track the key Tier 4 metrics over time**: pass rate, git-command leakage rate, `--json` and `--status-after` compliance, and cost per scenario.
+4. **Track the key Tier 4 metrics over time**: pass rate, git-command leakage rate, `--format json` and `--status-after` compliance, and cost per scenario.
 
 ### Supplemental Layers (Optional)
 
 
@@ -325,7 +325,7 @@ Reword commit message or rename branch.
 ```bash
 but reword <id>               # Interactive editor
 but reword <id> -m "new"      # Non-interactive
-but reword <id> --format      # Format to 72-char wrapping
+but reword <id> --fix-formatting  # Format to 72-char wrapping
 ```
 
 ### `but discard <id>`
 
@@ -36,20 +36,8 @@ pub struct Args {
     /// Run as if but was started in PATH instead of the current working directory.
     #[clap(short = 'C', long, default_value = ".", value_name = "PATH")]
     pub current_dir: PathBuf,
-    /// Explicitly control how output should be formatted.
-    ///
-    /// If unset and from a terminal, it defaults to human output, when redirected it's for shells.
-    #[clap(
-        long,
-        short = 'f',
-        env = "BUT_OUTPUT_FORMAT",
-        conflicts_with = "json",
-        default_value = "human"
-    )]
-    pub format: OutputFormat,
-    /// Whether to use JSON output format.
-    #[clap(long, short = 'j', global = true)]
-    pub json: bool,
+    #[clap(flatten)]
+    pub format: OutputFormatArg,
     /// Whether mutation commands should append workspace status.
     #[clap(skip)]
     pub status_after: bool,
@@ -66,6 +54,20 @@ pub struct Args {
     pub cmd: Option<Subcommands>,
 }
 
+// Output-format flag, split out of `Args` and pulled back in via `#[clap(flatten)]`.
+#[derive(clap::Args, Debug)]
+pub struct OutputFormatArg {
+    /// Explicitly control how output should be formatted.
+    ///
+    /// If unset and from a terminal, it defaults to human output, when redirected it's for shells.
+    // `global = true` allows the flag after a subcommand, e.g. `but move a b --format json`.
+    #[clap(long, global = true, env = "BUT_OUTPUT_FORMAT", default_value = "human")]
+    pub format: OutputFormat,
+}
+
 /// How we should format anything written to [`std::io::stdout()`].
 #[derive(Debug, Copy, Clone, clap::ValueEnum, Default)]
 pub enum OutputFormat {
@@ -573,19 +575,24 @@ pub enum Subcommands {
         /// Commit ID to edit the message for, or branch ID to rename
         target: CliIdArg,
         /// The new commit message or branch name. If not provided, opens an editor.
-        #[clap(short = 'm', long = "message", conflicts_with = "format")]
+        #[clap(short = 'm', long = "message", conflicts_with = "fix_formatting")]
         message: Option<String>,
         /// Format the existing commit message to 72-char line wrapping without opening an editor
-        #[clap(short = 'f', long = "format", conflicts_with = "message")]
+        #[clap(
+            id = "fix_formatting",
+            short = 'f',
+            long = "fix-formatting",
+            conflicts_with = "message"
+        )]
         format: bool,
         /// Always show diff inside the editor.
         ///
         /// By default the diff will be shown unless it's large. The diff will always be shown if
         /// `--diff` is passed, regardless of the size of the diff.
-        #[clap(long = "diff", default_value_t, conflicts_with_all = &["no_diff", "format"])]
+        #[clap(long = "diff", default_value_t, conflicts_with_all = &["no_diff", "fix_formatting"])]
         diff: bool,
         /// Never show the diff inside the editor.
-        #[clap(long = "no-diff", default_value_t, conflicts_with_all = &["diff", "format"])]
+        #[clap(long = "no-diff", default_value_t, conflicts_with_all = &["diff", "fix_formatting"])]
         no_diff: bool,
     },
 
 
@@ -145,12 +145,13 @@ fn status_after_is_hidden_noop_compatibility_flag() {
         "move",
         "source",
         "target",
-        "--json",
+        "--format",
+        "json",
         "--status-after",
     ])
     .expect("parse legacy status-after flag");
 
-    assert!(args.json);
+    assert!(matches!(args.format.format, OutputFormat::Json));
     assert!(args.legacy_status_after);
     assert!(!args.status_after);
 }
 
@@ -2,6 +2,18 @@ use clap::Parser as _;
 
 use crate::args::{Args, Subcommands};
 
+#[test]
+fn fix_formatting() {
+    // The long flag must be accepted on `reword` and switch the `format` field on.
+    let parsed = Args::try_parse_from(["but", "reword", "a", "--fix-formatting"]).unwrap();
+
+    match parsed.cmd.unwrap() {
+        Subcommands::Reword { format, .. } => assert!(format),
+        // Any other subcommand means the arguments were routed incorrectly.
+        cmd => panic!("expected reword command. Got {cmd:?}"),
+    }
+}
+
 #[test]
 fn always_show_diff() {
     let args = Args::try_parse_from(["but", "reword", "a", "--diff"]).unwrap();
Original file line number	Diff line number	Diff line change
`@@ -230,11 +230,11 @@`
`230`	`230`	`"script": [`
`231`	`231`	`{`
`232`	`232`	`"type": "input",`
`233`		`- "lines": ["# Everything takes --json"]`
	`233`	`+ "lines": ["# Everything takes --format json"]`
`234`	`234`	`},`
`235`	`235`	`{`
`236`	`236`	`"type": "input",`
`237`		`- "lines": ["$ but --json branch new feature/ai-integration \| jq ."]`
	`237`	`+ "lines": ["$ but --format json branch new feature/ai-integration \| jq ."]`
`238`	`238`	`},`
`239`	`239`	`{`
`240`	`240`	`"type": "output",`
`@@ -247,7 +247,7 @@`
`247`	`247`	`},`
`248`	`248`	`{`
`249`	`249`	`"type": "input",`
`250`		`- "lines": ["$ but show -j 90fe \| jq ."]`
	`250`	`+ "lines": ["$ but show --format json 90fe \| jq ."]`
`251`	`251`	`},`
`252`	`252`	`{`
`253`	`253`	`"type": "output",`
`@@ -265,7 +265,7 @@`
`265`	`265`	`},`
`266`	`266`	`{`
`267`	`267`	`"type": "input",`
`268`		`- "lines": ["$ but --json status \| jq '.stacks[].branches[].commits[]'"]`
	`268`	`+ "lines": ["$ but --format json status \| jq '.stacks[].branches[].commits[]'"]`
`269`	`269`	`},`
`270`	`270`	`{`
`271`	`271`	`"type": "output",`