BlackVectorOps
diff --git a/‎.github/workflows/semantic_analysis.yml‎
Lines changed: 115 additions & 116 deletions b/‎.github/workflows/semantic_analysis.yml‎
Lines changed: 115 additions & 116 deletions
diff --git a/‎internal/cli/index.go‎
Lines changed: 4 additions & 1 deletion b/‎internal/cli/index.go‎
Lines changed: 4 additions & 1 deletion
diff --git a/‎pkg/analysis/ir/benchmark_test.go‎
Lines changed: 114 additions & 0 deletions b/‎pkg/analysis/ir/benchmark_test.go‎
Lines changed: 114 additions & 0 deletions
@@ -36,6 +36,11 @@ jobs:
           # Verify binary works
           ./bin/sfw --version || ./bin/sfw help || true
 
+      - name: Vendor Dependencies
+        # Vendor modules into workspace so they're available inside the sandbox.
+        # The sandbox only mounts the workspace, not GOMODCACHE (/home/runner/go/pkg/mod).
+        run: go mod vendor
+
       - name: Determine Mode
         id: mode
         run: |
@@ -88,129 +93,123 @@ jobs:
              echo "has_go_files=false" >> $GITHUB_OUTPUT
           fi
 
-      - name: Run Semantic Analysis (Sandboxed)
-        uses: geomys/sandboxed-step@v1.2.0
-        with:
-          disable-network: 'true'
-          # CONTEXT INJECTION:
-          # We inject vars via interpolation. We write to a local artifact
-          # instead of trying to hit the runner's step summary directly.
-          run: |
-            export MODE="${{ steps.mode.outputs.mode }}"
-            export WORKTREE_DIR="${{ steps.prep.outputs.worktree_dir }}"
-            export HAS_GO="${{ steps.prep.outputs.has_go_files }}"
-            export SFW_SANDBOX_ID="1"
-            
-            # Strict mode enabled after exports
-            set -euo pipefail
-
-            # Define local report artifact (Safe Write)
-            REPORT_FILE="scan_report.md"
-
-            echo "## Semantic Analysis Report ($MODE)" >> "$REPORT_FILE"
-            echo "| File | Status | Match % |" >> "$REPORT_FILE"
-            echo "| :--- | :--- | :--- |" >> "$REPORT_FILE"
-
-            if [ "$HAS_GO" != "true" ]; then
-                echo "No Go files changed." >> "$REPORT_FILE"
-                exit 0
+      # Install dependencies for sfw's internal sandbox (AppArmor bypass via aa-exec)
+      - name: Install Sandbox Dependencies
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y apparmor-utils
+
+      - name: Run Semantic Analysis
+        env:
+          MODE: ${{ steps.mode.outputs.mode }}
+          WORKTREE_DIR: ${{ steps.prep.outputs.worktree_dir }}
+          HAS_GO: ${{ steps.prep.outputs.has_go_files }}
+          # Use vendored dependencies - sandbox can't access GOMODCACHE
+          GOFLAGS: "-mod=vendor"
+          GOPROXY: "off"
+        run: |
+          set -euo pipefail
+
+          REPORT_FILE="scan_report.md"
+
+          echo "## Semantic Analysis Report ($MODE)" >> "$REPORT_FILE"
+          echo "| File | Status | Match % |" >> "$REPORT_FILE"
+          echo "| :--- | :--- | :--- |" >> "$REPORT_FILE"
+
+          if [ "$HAS_GO" != "true" ]; then
+              echo "No Go files changed." >> "$REPORT_FILE"
+              exit 0
+          fi
+
+          ERROR_COUNT=0
+          LOGIC_FAIL=0
+
+          # Process the pre-calculated diff stream
+          while IFS= read -r -d '' status; do
+            case "$status" in
+              R*|C*)
+                 IFS= read -r -d '' old_path
+                 IFS= read -r -d '' new_path
+                 OLD_FILE_REF="$old_path"
+                 NEW_FILE_REF="$new_path"
+                 ;;
+              *)
+                 IFS= read -r -d '' path
+                 OLD_FILE_REF="$path"
+                 NEW_FILE_REF="$path"
+                 ;;
+            esac
+
+            if [[ "$NEW_FILE_REF" != *.go ]] && [[ "$OLD_FILE_REF" != *.go ]]; then continue; fi
+
+            if [ -f "$NEW_FILE_REF" ]; then
+                NEW_FILE="$NEW_FILE_REF"
+            else
+                NEW_FILE=""
             fi
 
-            # Check for required tools inside sandbox
-            if ! command -v jq >/dev/null; then
-                echo "::error::'jq' is missing from the sandbox environment."
-                exit 1
+            OLD_FILE="$WORKTREE_DIR/$OLD_FILE_REF"
+            if [ ! -f "$OLD_FILE" ]; then
+                OLD_FILE=""
             fi
 
-            ERROR_COUNT=0
-            LOGIC_FAIL=0
-
-            # Process the pre-calculated diff stream
-            while IFS= read -r -d '' status; do
-              case "$status" in
-                R*|C*)
-                   IFS= read -r -d '' old_path
-                   IFS= read -r -d '' new_path
-                   OLD_FILE_REF="$old_path"
-                   NEW_FILE_REF="$new_path"
-                   ;;
-                *)
-                   IFS= read -r -d '' path
-                   OLD_FILE_REF="$path"
-                   NEW_FILE_REF="$path"
-                   ;;
-              esac
-
-              if [[ "$NEW_FILE_REF" != *.go ]] && [[ "$OLD_FILE_REF" != *.go ]]; then continue; fi
-
-              if [ -f "$NEW_FILE_REF" ]; then
-                  NEW_FILE="$NEW_FILE_REF"
-              else
-                  NEW_FILE=""
-              fi
-
-              OLD_FILE="$WORKTREE_DIR/$OLD_FILE_REF"
-              if [ ! -f "$OLD_FILE" ]; then
-                  OLD_FILE=""
-              fi
-
-              if [[ -z "$NEW_FILE" ]] && [[ -z "$OLD_FILE" ]]; then continue; fi
-
-              if [[ -z "$OLD_FILE" ]]; then
-                  echo "| \`$NEW_FILE_REF\` | New File | N/A |" >> "$REPORT_FILE"
-                  continue
-              fi
-
-              if [[ -z "$NEW_FILE" ]]; then
-                  echo "| \`$OLD_FILE_REF\` | Deleted | N/A |" >> "$REPORT_FILE"
-                  continue
-              fi
-
-              # Execute SFW with stderr capture
-              if ! OUTPUT=$(./bin/sfw diff "$OLD_FILE" "$NEW_FILE" 2>&1); then
-                  echo "::error::sfw failed to process $NEW_FILE_REF"
-                  ERROR_COUNT=$((ERROR_COUNT + 1))
-                  continue
-              fi
-
-              # Validate JSON
-              if ! echo "$OUTPUT" | jq -e . >/dev/null 2>&1; then
-                  echo "::error::Invalid JSON output for $NEW_FILE_REF"
-                  ERROR_COUNT=$((ERROR_COUNT + 1))
-                  continue
-              fi
-
-              PCT=$(echo "$OUTPUT" | jq -r '.summary.semantic_match_pct // 0')
-              MODIFIED=$(echo "$OUTPUT" | jq -r '.summary.modified // 0')
-              IS_BELOW_100=$(echo "$OUTPUT" | jq -r 'if (.summary.semantic_match_pct // 0) < 100 then "true" else "false" end')
-
-              if [ "$IS_BELOW_100" = "true" ]; then
-                  STATUS_ICON="Modified ($MODIFIED)"
-                  echo "| \`$NEW_FILE_REF\` | $STATUS_ICON | **$PCT%** |" >> "$REPORT_FILE"
-
-                  if [ "$MODE" == "BLOCKER" ]; then
-                      echo "::error file=$NEW_FILE_REF::Logic change detected in safe refactor! ($PCT%)"
-                      LOGIC_FAIL=1
-                  fi
-              else
-                  STATUS_ICON="Preserved"
-                  echo "| \`$NEW_FILE_REF\` | $STATUS_ICON | **$PCT%** |" >> "$REPORT_FILE"
-              fi
-
-            done < diff_stream.bin
-
-            if [ $ERROR_COUNT -gt 0 ]; then
-                echo "" >> "$REPORT_FILE"
-                echo "**CI FAILED**: Tool execution failures detected." >> "$REPORT_FILE"
-                exit 1
+            if [[ -z "$NEW_FILE" ]] && [[ -z "$OLD_FILE" ]]; then continue; fi
+
+            if [[ -z "$OLD_FILE" ]]; then
+                echo "| \`$NEW_FILE_REF\` | New File | N/A |" >> "$REPORT_FILE"
+                continue
             fi
 
-            if [ $LOGIC_FAIL -eq 1 ]; then
-                echo "" >> "$REPORT_FILE"
-                echo "**CI FAILED**: Logic changed in 'semantic-safe' PR." >> "$REPORT_FILE"
-                exit 1
+            if [[ -z "$NEW_FILE" ]]; then
+                echo "| \`$OLD_FILE_REF\` | Deleted | N/A |" >> "$REPORT_FILE"
+                continue
             fi
 
+            # Execute SFW diff (sfw handles its own sandboxing internally)
+            if ! OUTPUT=$(./bin/sfw diff "$OLD_FILE" "$NEW_FILE" 2>&1); then
+                echo "::error::sfw failed to process $NEW_FILE_REF"
+                ERROR_COUNT=$((ERROR_COUNT + 1))
+                continue
+            fi
+
+            # Validate JSON
+            if ! echo "$OUTPUT" | jq -e . >/dev/null 2>&1; then
+                echo "::error::Invalid JSON output for $NEW_FILE_REF"
+                ERROR_COUNT=$((ERROR_COUNT + 1))
+                continue
+            fi
+
+            PCT=$(echo "$OUTPUT" | jq -r '.summary.semantic_match_pct // 0')
+            MODIFIED=$(echo "$OUTPUT" | jq -r '.summary.modified // 0')
+            IS_BELOW_100=$(echo "$OUTPUT" | jq -r 'if (.summary.semantic_match_pct // 0) < 100 then "true" else "false" end')
+
+            if [ "$IS_BELOW_100" = "true" ]; then
+                STATUS_ICON="Modified ($MODIFIED)"
+                echo "| \`$NEW_FILE_REF\` | $STATUS_ICON | **$PCT%** |" >> "$REPORT_FILE"
+
+                if [ "$MODE" == "BLOCKER" ]; then
+                    echo "::error file=$NEW_FILE_REF::Logic change detected in safe refactor! ($PCT%)"
+                    LOGIC_FAIL=1
+                fi
+            else
+                STATUS_ICON="Preserved"
+                echo "| \`$NEW_FILE_REF\` | $STATUS_ICON | **$PCT%** |" >> "$REPORT_FILE"
+            fi
+
+          done < diff_stream.bin
+
+          if [ $ERROR_COUNT -gt 0 ]; then
+              echo "" >> "$REPORT_FILE"
+              echo "**CI FAILED**: Tool execution failures detected." >> "$REPORT_FILE"
+              exit 1
+          fi
+
+          if [ $LOGIC_FAIL -eq 1 ]; then
+              echo "" >> "$REPORT_FILE"
+              echo "**CI FAILED**: Logic changed in 'semantic-safe' PR." >> "$REPORT_FILE"
+              exit 1
+          fi
+
       - name: Publish Analysis Report
         if: always()
         # This runs on the host, so it has access to GITHUB_STEP_SUMMARY.
@@ -227,4 +226,4 @@ jobs:
         run: |
           if [ -d "$WORKTREE_DIR" ]; then
              git worktree remove --force "$WORKTREE_DIR" 2>/dev/null || rm -rf "$WORKTREE_DIR"
-          fi
+          fi
@@ -166,10 +166,13 @@ func RunIndexJSON(target string, results []diff.FingerprintResult, name, severit
 			Created: time.Now().Format("2006-01-02"),
 		}
 
-		scanner.AddSignature(&sig)
 		indexed = append(indexed, sig)
 	}
 
+	if err := scanner.AddSignatures(indexed); err != nil {
+		return nil, 0, err
+	}
+
 	if err := scanner.SaveDatabase(dbPath); err != nil {
 		return nil, 0, err
 	}
 
@@ -0,0 +1,114 @@
+package ir_test
+
+import (
+	"go/token"
+	"os"
+	"path/filepath"
+	"strings"
+	"testing"
+
+	"github.com/BlackVectorOps/semantic_firewall/v3/pkg/analysis/ir"
+	"golang.org/x/tools/go/packages"
+	"golang.org/x/tools/go/ssa"
+)
+
+// compileForBenchmark writes src as main.go inside a throwaway module, loads
+// it with go/packages, builds SSA through ir.BuildSSAFromPackages, and returns
+// the first package member function whose name equals funcName (or ends in
+// "."+funcName).
+//
+// Every failure path (file writes, package load, compile errors, SSA build,
+// function not found) aborts the benchmark via b.Fatal/b.Fatalf.
+func compileForBenchmark(b *testing.B, src, funcName string) *ssa.Function {
+	b.Helper()
+
+	// b.TempDir hands back a fresh directory and registers its removal with
+	// the benchmark's cleanup, replacing the manual MkdirTemp/RemoveAll pair
+	// and its error branch.
+	dir := b.TempDir()
+
+	// A minimal go.mod so the source is loaded as its own module.
+	modPath := filepath.Join(dir, "go.mod")
+	if err := os.WriteFile(modPath, []byte("module testmod\n\ngo 1.23\n"), 0644); err != nil {
+		b.Fatalf("failed to create go.mod: %v", err)
+	}
+
+	path := filepath.Join(dir, "main.go")
+	if err := os.WriteFile(path, []byte(src), 0644); err != nil {
+		b.Fatalf("write source: %v", err)
+	}
+
+	// Environment for the build-system query that go/packages runs: module
+	// mode on, module proxy disabled, cgo disabled.
+	env := append(os.Environ(), "GO111MODULE=on", "GOPROXY=off", "CGO_ENABLED=0")
+
+	cfg := &packages.Config{
+		Dir:  dir,
+		Mode: packages.LoadAllSyntax,
+		Fset: token.NewFileSet(),
+		Env:  env,
+	}
+
+	// The "file=" query selects the package containing the given file.
+	pkgs, err := packages.Load(cfg, "file="+path)
+	if err != nil {
+		b.Fatalf("packages.Load: %v", err)
+	}
+	// Load's error only covers setup problems; per-package parse/type errors
+	// are attached to pkgs and surfaced here.
+	if packages.PrintErrors(pkgs) > 0 {
+		b.Fatal("compilation errors in test source")
+	}
+
+	prog, _, err := ir.BuildSSAFromPackages(pkgs)
+	if err != nil {
+		b.Fatalf("BuildSSA: %v", err)
+	}
+
+	// Scan each loaded package's SSA members for the requested function.
+	for _, pkg := range pkgs {
+		ssaPkg := prog.Package(pkg.Types)
+		if ssaPkg == nil {
+			continue
+		}
+		for _, member := range ssaPkg.Members {
+			if fn, ok := member.(*ssa.Function); ok {
+				if fn.Name() == funcName || strings.HasSuffix(fn.Name(), "."+funcName) {
+					return fn
+				}
+			}
+		}
+	}
+
+	b.Fatalf("function %q not found in SSA program", funcName)
+	return nil
+}
+
+// BenchmarkCanonicalizeFunction times CanonicalizeFunction on one SSA function
+// built from an inline source snippet. The snippet mixes defer, select, map
+// update, goroutine launch, make, and a type assertion so that several
+// instruction kinds are visited.
+//
+// Compilation happens once before the timer is reset; each iteration acquires
+// a canonicalizer, canonicalizes the function, and releases the canonicalizer.
+func BenchmarkCanonicalizeFunction(b *testing.B) {
+	// Source code with various instruction types to exercise different paths
+	src := `package main
+
+	func everything(ch chan int, m map[string]interface{}) interface{} {
+		// Defer
+		defer func() { recover() }()
+
+		res := 0
+
+		// Select
+		select {
+		case x := <-ch:
+			// Map Update & Interface
+			m["val"] = x
+			res = x
+		default:
+			// MakeSlice & Go
+			go func() { _ = make([]int, 10, 20) }()
+			res = 1
+		}
+
+		// Type Assert
+		if val, ok := m["val"].(int); ok {
+			return val * 2
+		}
+
+		return res
+	}`
+
+	fn := compileForBenchmark(b, src, "everything")
+	// Use default policy
+	policy := ir.DefaultLiteralPolicy
+
+	// Always report allocs/op, without requiring -benchmem, so allocation
+	// regressions in the acquire/canonicalize/release cycle are visible.
+	// NOTE(review): Acquire/Release look like a pooled API; confirm in pkg ir.
+	b.ReportAllocs()
+	// Exclude the one-time compile/SSA build above from the measurement.
+	b.ResetTimer()
+	for i := 0; i < b.N; i++ {
+		// Acquire/Release per iteration to simulate real usage
+		c := ir.AcquireCanonicalizer(policy)
+		c.CanonicalizeFunction(fn)
+		ir.ReleaseCanonicalizer(c)
+	}
+}
Original file line number	Diff line number	Diff line change
`@@ -166,10 +166,13 @@ func RunIndexJSON(target string, results []diff.FingerprintResult, name, severit`
`166`	`166`	`Created: time.Now().Format("2006-01-02"),`
`167`	`167`	`}`
`168`	`168`
`169`		`- scanner.AddSignature(&sig)`
`170`	`169`	`indexed = append(indexed, sig)`
`171`	`170`	`}`
`172`	`171`
	`172`	`+ if err := scanner.AddSignatures(indexed); err != nil {`
	`173`	`+ return nil, 0, err`
	`174`	`+ }`
	`175`	`+`
`173`	`176`	`if err := scanner.SaveDatabase(dbPath); err != nil {`
`174`	`177`	`return nil, 0, err`
`175`	`178`	`}`