supabase-community
diff --git a/‎Cargo.lock‎
Lines changed: 897 additions & 837 deletions b/‎Cargo.lock‎
Lines changed: 897 additions & 837 deletions
diff --git a/‎crates/pgls_pretty_print/Cargo.toml‎
Lines changed: 1 addition & 0 deletions b/‎crates/pgls_pretty_print/Cargo.toml‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎crates/pgls_pretty_print/nodes.txt‎
Lines changed: 0 additions & 11849 deletions b/‎crates/pgls_pretty_print/nodes.txt‎
Lines changed: 0 additions & 11849 deletions
diff --git a/‎crates/pgls_pretty_print/tests/normalize_coverage.rs‎
Lines changed: 204 additions & 0 deletions b/‎crates/pgls_pretty_print/tests/normalize_coverage.rs‎
Lines changed: 204 additions & 0 deletions
diff --git a/‎docs/features/formatting.md‎
Lines changed: 5 additions & 0 deletions b/‎docs/features/formatting.md‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎justfile‎
Lines changed: 0 additions & 117 deletions b/‎justfile‎
Lines changed: 0 additions & 117 deletions
diff --git a/‎scripts/pp-hook.sh‎
Lines changed: 0 additions & 48 deletions b/‎scripts/pp-hook.sh‎
Lines changed: 0 additions & 48 deletions
@@ -21,3 +21,4 @@ camino.workspace                  = true
 dir-test.workspace                = true
 insta.workspace                   = true
 pgls_statement_splitter.workspace = true
+regex.workspace                   = true
@@ -0,0 +1,204 @@
+//! Normalize Coverage Test
+//!
+//! This test verifies that all AST node types with `location` fields are handled
+//! in the `clear_location` function in `normalize.rs`.
+//!
+//! When `libpg_query` is upgraded and new node types are added that have location
+//! fields, this test will fail and list exactly which types need to be added to
+//! the normalization code.
+//!
+//! ## When this test fails:
+//! 1. Look at the "Missing handlers" list
+//! 2. Add each missing type to `clear_location` in `normalize.rs`
+//! 3. For each type, set `(*n).location = 0;` at minimum
+//! 4. Check if the type needs additional normalization beyond location clearing
+
+use regex::Regex;
+use std::collections::HashSet;
+use std::fs;
+use std::path::PathBuf;
+
+/// Collects the name of every struct in the generated `protobuf.rs` whose body
+/// declares a `pub location: i32` field.
+///
+/// The file is looked up at `pgls_query/src/protobuf.rs` next to this crate's
+/// manifest directory and is scanned textually with regexes, not parsed.
+///
+/// # Panics
+///
+/// Panics if the manifest directory has no parent or if `protobuf.rs` cannot
+/// be read.
+fn extract_types_with_location() -> HashSet<String> {
+    // A struct is matched as `pub struct Name { ... }`; the captured body runs
+    // up to the first closing brace after the opening one.
+    let struct_pattern = Regex::new(r"pub struct (\w+)\s*\{([^}]+)\}").unwrap();
+    let location_pattern = Regex::new(r"pub location:\s*i32").unwrap();
+
+    let manifest = PathBuf::from(env!("CARGO_MANIFEST_DIR"));
+    let protobuf_file = manifest
+        .parent()
+        .unwrap()
+        .join("pgls_query/src/protobuf.rs");
+    let source = fs::read_to_string(&protobuf_file)
+        .expect("Failed to read protobuf.rs - has it been generated?");
+
+    // Keep the struct name (group 1) whenever its body (group 2) has the field.
+    struct_pattern
+        .captures_iter(&source)
+        .filter(|caps| location_pattern.is_match(&caps[2]))
+        .map(|caps| caps[1].to_string())
+        .collect()
+}
+
+/// Collects the `NodeMut` variant names that appear inside `clear_location`
+/// in `src/normalize.rs`.
+///
+/// The function is located textually: the span starts at the first
+/// `fn clear_location` and ends at the first closing brace in column zero that
+/// is followed by a blank line, or at end of file when no such terminator
+/// exists. Every `NodeMut::Name(` occurrence in that span counts as handled.
+///
+/// # Panics
+///
+/// Panics if `normalize.rs` cannot be read or does not contain
+/// `fn clear_location`.
+fn extract_handled_types() -> HashSet<String> {
+    let normalize_file = PathBuf::from(env!("CARGO_MANIFEST_DIR")).join("src/normalize.rs");
+    let source = fs::read_to_string(&normalize_file).expect("Failed to read normalize.rs");
+
+    let fn_offset = source
+        .find("fn clear_location")
+        .expect("Could not find clear_location function");
+    let from_fn = &source[fn_offset..];
+
+    // Cut at the end of the function; without a terminator, scan to end of file.
+    let fn_text = match from_fn.find("\n}\n\n") {
+        Some(len) => &from_fn[..len],
+        None => from_fn,
+    };
+
+    let variant_pattern = Regex::new(r"NodeMut::(\w+)\(").unwrap();
+    let mut handled = HashSet::new();
+    for caps in variant_pattern.captures_iter(fn_text) {
+        handled.insert(caps[1].to_string());
+    }
+    handled
+}
+
+/// Returns the struct names that are allowed to have a `location` field
+/// without a matching handler in `clear_location`.
+///
+/// Entries are compared as exact strings against the struct names extracted
+/// from `protobuf.rs`, so spelling and casing must match the generated code.
+/// Each entry falls into one of these groups:
+/// - Internal types not directly in the AST (e.g., ParseResult, ScanResult)
+/// - Planner/executor nodes that don't appear in parsed SQL ASTs
+/// - Types handled in separate normalization functions
+/// - Types where location is handled via parent node traversal
+/// - Parser nodes that are tolerated for now and still need review
+fn known_exceptions() -> HashSet<&'static str> {
+    [
+        // ===== Internal/container types =====
+        "ParseResult",
+        "ScanResult",
+        "ScanToken",
+        "Node",
+        "RawStmt", // location is stmt_location, handled separately
+        "Integer",
+        "Float",
+        "Boolean",
+        "List",
+        "IntList",
+        "OidList",
+        // ===== Planner/executor nodes (not in parser output) =====
+        // These are internal representations created during query planning,
+        // not during parsing. They won't appear in parsed SQL ASTs.
+        "Aggref",              // aggregate reference - planner node
+        "ArrayCoerceExpr",     // array coercion - planner node
+        "ArrayExpr",           // constructed array - planner node
+        "CoerceToDomain",      // domain coercion - planner node
+        "CoerceToDomainValue", // domain value coercion - planner node
+        "CoerceViaIo",         // I/O coercion - planner node
+        "CollateExpr",         // collation expression - planner node
+        "ConvertRowtypeExpr",  // row type conversion - planner node
+        "DistinctExpr",        // DISTINCT expression - planner node
+        "FuncExpr",            // function expression - planner node (FuncCall is parser)
+        "NullIfExpr",          // NULLIF expression - planner node
+        "OpExpr",              // operator expression - planner node (AExpr is parser)
+        "Param",               // query parameter - planner node (ParamRef is parser)
+        "RelabelType",         // type relabeling - planner node
+        "ScalarArrayOpExpr",   // scalar array op - planner node
+        "TableFunc",           // table function - planner node
+        "Var",                 // variable reference - planner node (ColumnRef is parser)
+        "WindowFunc",          // window function - planner node (FuncCall is parser)
+        // ===== Handled in separate normalization functions =====
+        // NOTE(review): the function names below are not visible from this
+        // file; confirm they still exist in normalize.rs when editing.
+        "MergeSupportFunc", // handled in normalize_merge_support_func
+        "SqlValueFunction", // handled in normalize_sql_value_function
+        "WithClause",       // handled in normalize_merge_support_func_recursive
+        // ===== JSON nodes (handled via parent node, or planner-only) =====
+        "JsonFormat",          // handled via JsonFuncExpr, JsonArrayConstructor, etc.
+        "JsonConstructorExpr", // internal JSON constructor - planner node
+        "JsonExpr",            // internal JSON expression - planner node
+        // ===== Parser nodes that need review =====
+        // These appear in parsed ASTs but may not need explicit handling
+        // if the pretty-print tests pass without them
+        "CteCycleClause",      // CTE CYCLE clause - rarely used
+        "CteSearchClause",     // CTE SEARCH clause - rarely used
+        "PartitionRangeDatum", // partition range datum - handled via PartitionBoundSpec
+        "PlAssignStmt",        // PL/pgSQL assignment - not standard SQL
+    ]
+    .into_iter()
+    .collect()
+}
+
+/// Fails when a struct with a `location` field has neither a handler in
+/// `clear_location` nor an entry in `known_exceptions()`.
+///
+/// Both inputs are produced by regex scans over source text, so the test
+/// first checks that each scan found something. Without those guards a change
+/// in the generated code layout (or in how handlers are written) would yield
+/// empty sets and the coverage check would pass without checking anything.
+#[test]
+fn all_location_fields_are_normalized() {
+    let types_with_location = extract_types_with_location();
+    let handled_types = extract_handled_types();
+    let exceptions = known_exceptions();
+
+    // Guard against a vacuous pass: an empty scan means the extraction is
+    // broken, not that everything is covered.
+    assert!(
+        !types_with_location.is_empty(),
+        "No structs with a `location` field were found in protobuf.rs; \
+         the extraction regex in this test likely needs updating"
+    );
+    assert!(
+        !handled_types.is_empty(),
+        "No `NodeMut::` handlers were found in clear_location in normalize.rs; \
+         the extraction logic in this test likely needs updating"
+    );
+
+    let mut missing: Vec<_> = types_with_location
+        .iter()
+        .filter(|t| !handled_types.contains(*t) && !exceptions.contains(t.as_str()))
+        .collect();
+
+    // Sorted so the failure message is stable between runs.
+    missing.sort();
+
+    assert!(
+        missing.is_empty(),
+        "\n\n\
+        ========================================\n\
+        AST NORMALIZATION COVERAGE INCOMPLETE\n\
+        ========================================\n\n\
+        The following types have `location` fields but are NOT handled\n\
+        in the `clear_location` function in normalize.rs:\n\n\
+        {}\n\n\
+        To fix:\n\
+        1. Add a handler for each type in the `clear_location` match\n\
+        2. At minimum: `NodeMut::TypeName(n) => {{ (*n).location = 0; }}`\n\
+        3. Check if additional normalization is needed\n\n\
+        If a type should NOT be normalized, add it to `known_exceptions()`\n\
+        in this test file with a comment explaining why.\n\
+        ========================================\n",
+        missing
+            .iter()
+            .map(|t| format!("  - {}", t))
+            .collect::<Vec<_>>()
+            .join("\n")
+    );
+}
+
+/// Informational check: prints the `clear_location` handlers whose type has
+/// no `location` field in `protobuf.rs`.
+///
+/// This test never fails. Such handlers may be normalizing other fields, so
+/// the list is only printed for review.
+#[test]
+fn no_obsolete_handlers() {
+    let located = extract_types_with_location();
+
+    let mut without_location: Vec<String> = extract_handled_types()
+        .into_iter()
+        .filter(|name| !located.contains(name))
+        .collect();
+    without_location.sort();
+
+    // Nothing to report; the check is advisory either way.
+    if without_location.is_empty() {
+        return;
+    }
+
+    let listing = without_location
+        .iter()
+        .map(|name| format!("  - {}", name))
+        .collect::<Vec<_>>()
+        .join("\n");
+
+    println!(
+        "\nNote: The following handlers in clear_location reference types \
+         that don't have a `location` field (they may have other fields being normalized):\n\
+         {}\n\
+         This is fine if the handler normalizes other fields, but worth reviewing.\n",
+        listing
+    );
+}
@@ -2,6 +2,11 @@
 
 > **Preview Feature**: The formatter is currently in preview. We'd love feedback from early adopters! Please report any issues or unexpected output at [GitHub Issues](https://github.com/supabase-community/postgres-language-server/issues).
 
+## Known Limitations
+
+!!! warning "Comments are not yet supported"
+    SQL comments (`--` and `/* */`) will be removed during formatting. This is a temporary limitation that will be addressed in a future release. If your SQL files contain important comments, consider waiting for comment support before using the formatter on those files.
+
 The language server provides SQL formatting that produces consistent, readable code. Built on Postgres' own parser, the formatter ensures 100% syntax compatibility with your SQL.
 
 ## Configuration
 
@@ -158,120 +158,3 @@ quick-modify:
 show-logs:
     tail -f $(ls $PGLS_LOG_PATH/server.log.* | sort -t- -k2,2 -k3,3 -k4,4 | tail -n 1)
 
-# Run a codex agent with the given agentic prompt file.
-# Commented out by default to avoid accidental usage that may incur costs.
-agentic name:
-    codex exec --yolo "please read agentic/{{name}}.md and follow the instructions closely while continueing the described task. Make sure to understand recent Session History, Implementation Learnings and read all instructions. Continue until the task is complete."
-
-# === Pretty Printer Development ===
-
-# Run pretty printer agentic task (Stop hook auto-loops until tests pass)
-pp-agentic:
-    claude --dangerously-skip-permissions "Read agentic/pretty_printer.md and agentic/session_log.md. \
-    \
-    Your goal: Complete the pretty printer by fixing node implementations until ALL tests pass. \
-    \
-    Workflow: \
-    1. Run 'just pp-status' to see current state \
-    2. Run 'just pp-failing' to find failing tests \
-    3. Pick a failing test and debug with 'just pp-debug <name>' \
-    4. Fix the emit_* function in crates/pgls_pretty_print/src/nodes/*.rs \
-    5. Verify with 'just pp-test <pattern>' \
-    6. Accept valid snapshots with 'just pp-review' \
-    7. Repeat \
-    \
-    Follow the Implementation Learnings in pretty_printer.md. Update session_log.md with your progress."
-
-# Show pretty printer implementation status
-pp-status:
-    @./scripts/pp-status.sh
-
-# Test with pattern filter (e.g., just pp-test select_stmt)
-pp-test pattern:
-    cargo test -p pgls_pretty_print -- {{pattern}} --show-output
-
-# List failing tests
-pp-failing:
-    @cargo test -p pgls_pretty_print 2>&1 | grep "FAILED" | head -30
-
-# Debug a specific test with full output
-pp-debug name:
-    cargo test -p pgls_pretty_print {{name}} -- --show-output --nocapture
-
-# Review pending snapshots
-pp-review:
-    cargo insta review -p pgls_pretty_print
-
-# Accept all pending snapshots
-pp-accept:
-    cargo insta accept -p pgls_pretty_print
-
-# Analyze failure patterns
-pp-analyze:
-    @echo "=== Failure Analysis ===" && \
-    cargo test -p pgls_pretty_print 2>&1 | grep -oE "test_(single|multi)__[a-z0-9_]+" | sort | uniq -c | sort -rn | head -20
-
-# Run only single-statement tests (faster iteration)
-pp-single:
-    cargo test -p pgls_pretty_print test_single
-
-# Run only multi-statement tests
-pp-multi:
-    cargo test -p pgls_pretty_print test_multi
-
-# Short aliases (only for commands without required args)
-pps: pp-status
-ppf: pp-failing
-ppr: pp-review
-
-# ============================================================================
-# WASM Build
-# ============================================================================
-
-# Build WASM bindings (debug) - uses Nix if available
-build-wasm:
-    #!/usr/bin/env bash
-    if command -v nix &> /dev/null && [ -f crates/pgls_wasm/flake.nix ]; then
-        echo "Building with Nix..."
-        nix develop ./crates/pgls_wasm#default --command ./crates/pgls_wasm/build-wasm.sh
-    else
-        ./crates/pgls_wasm/build-wasm.sh
-    fi
-
-# Build WASM bindings (release) - uses Nix if available
-build-wasm-release:
-    #!/usr/bin/env bash
-    if command -v nix &> /dev/null && [ -f crates/pgls_wasm/flake.nix ]; then
-        echo "Building with Nix..."
-        nix develop ./crates/pgls_wasm#default --command ./crates/pgls_wasm/build-wasm.sh --release
-    else
-        ./crates/pgls_wasm/build-wasm.sh --release
-    fi
-
-# Build WASM using Nix (recommended)
-build-wasm-nix:
-    nix build ./crates/pgls_wasm#default
-
-# Enter WASM development shell with Nix
-wasm-shell:
-    nix develop ./crates/pgls_wasm#default
-
-# Check if WASM build prerequisites are installed
-check-wasm-prereqs:
-    @echo "Checking WASM build prerequisites..."
-    @command -v nix >/dev/null 2>&1 && echo "✓ Nix found (recommended)" || echo "○ Nix not found (optional but recommended)"
-    @command -v emcc >/dev/null 2>&1 && echo "✓ Emscripten (emcc) found" || echo "✗ Emscripten not found - install from https://emscripten.org or use Nix"
-    @rustup target list --installed 2>/dev/null | grep -q wasm32-unknown-emscripten && echo "✓ wasm32-unknown-emscripten target installed" || echo "✗ Missing target - run: rustup target add wasm32-unknown-emscripten"
-
-# Install WASM build prerequisites (non-Nix)
-install-wasm-prereqs:
-    rustup target add wasm32-unknown-emscripten
-    @echo ""
-    @echo "NOTE: You also need to install Emscripten SDK manually:"
-    @echo "  https://emscripten.org/docs/getting_started/downloads.html"
-    @echo ""
-    @echo "After installing, activate it with:"
-    @echo "  source /path/to/emsdk/emsdk_env.sh"
-    @echo ""
-    @echo "Or use Nix (recommended): just wasm-shell"
-