GrayCodeAI
diff --git a/‎internal/evolution/analysis.go‎
Lines changed: 170 additions & 0 deletions b/‎internal/evolution/analysis.go‎
Lines changed: 170 additions & 0 deletions
diff --git a/‎internal/evolution/engine.go‎
Lines changed: 27 additions & 0 deletions b/‎internal/evolution/engine.go‎
Lines changed: 27 additions & 0 deletions
diff --git a/‎internal/evolution/git.go‎
Lines changed: 9 additions & 1 deletion b/‎internal/evolution/git.go‎
Lines changed: 9 additions & 1 deletion
diff --git a/‎internal/evolution/git_test.go‎
Lines changed: 5 additions & 3 deletions b/‎internal/evolution/git_test.go‎
Lines changed: 5 additions & 3 deletions
diff --git a/‎internal/evolution/phases.go‎
Lines changed: 34 additions & 7 deletions b/‎internal/evolution/phases.go‎
Lines changed: 34 additions & 7 deletions
diff --git a/‎internal/evolution/prompts.go‎
Lines changed: 24 additions & 12 deletions b/‎internal/evolution/prompts.go‎
Lines changed: 24 additions & 12 deletions
@@ -0,0 +1,170 @@
+package evolution
+
+import (
+	"os/exec"
+	"path/filepath"
+	"sort"
+	"strconv"
+	"strings"
+)
+
+// CodeAnalysis is the result of one AnalyzeCodebase pass over a repository:
+// the lists of findings plus the pass/fail state of the build and the tests.
+type CodeAnalysis struct {
+	// TODOs holds one "file:line: content" entry per marker comment found.
+	TODOs []string
+	// Hotspots holds the most frequently changed files.
+	Hotspots []string
+	// NoTestPkgs holds the packages that have no test files.
+	NoTestPkgs []string
+	// BuildOK and TestOK record whether the build and the test run succeeded.
+	BuildOK, TestOK bool
+}
+
+// AnalyzeCodebase scans the repository rooted at repoPath for improvement
+// opportunities and returns everything it found.
+//
+// It runs `go build ./...` and `go test ./...` inside repoPath and records
+// whether each succeeded, then collects TODO-style markers, the most
+// frequently changed files, and the packages without tests. A failing build
+// or test run is not reported as an error; it only clears the matching flag.
+func AnalyzeCodebase(repoPath string) CodeAnalysis {
+	// goSucceeds runs a go subcommand from the repository root. Without an
+	// explicit Dir the command inherits the process's working directory and
+	// could end up checking a different module than the one at repoPath.
+	goSucceeds := func(args ...string) bool {
+		cmd := exec.Command("go", args...)
+		cmd.Dir = repoPath
+		return cmd.Run() == nil
+	}
+
+	// Field expressions are evaluated top to bottom, so the probes run in
+	// this order: build, test, TODOs, hotspots, untested packages.
+	return CodeAnalysis{
+		BuildOK:    goSucceeds("build", "./..."),
+		TestOK:     goSucceeds("test", "./..."),
+		TODOs:      findTODOs(repoPath),
+		Hotspots:   findHotspots(repoPath),
+		NoTestPkgs: findNoTestPackages(repoPath),
+	}
+}
+
+// FormatAnalysis renders the analysis as Markdown-style text for the agent.
+//
+// Build and test failures come first as warnings, followed by one bulleted
+// section per non-empty finding list. At most 10 TODOs and 5 hotspots are
+// printed; packages without tests are always listed in full.
+func (a CodeAnalysis) FormatAnalysis() string {
+	var out strings.Builder
+
+	// section writes a heading followed by up to limit bullet items and a
+	// trailing blank line; it writes nothing when items is empty. A negative
+	// limit means the list is not capped.
+	section := func(heading string, items []string, limit int) {
+		if len(items) == 0 {
+			return
+		}
+		if limit >= 0 && len(items) > limit {
+			items = items[:limit]
+		}
+		out.WriteString(heading)
+		for _, item := range items {
+			out.WriteString("- " + item + "\n")
+		}
+		out.WriteString("\n")
+	}
+
+	if !a.BuildOK {
+		out.WriteString("🔴 BUILD BROKEN — fix this first!\n\n")
+	}
+	if !a.TestOK {
+		out.WriteString("🔴 TESTS FAILING — fix this first!\n\n")
+	}
+
+	section("## TODOs found in code\n\n", a.TODOs, 10)
+	section("## Most changed files (hotspots)\n\n", a.Hotspots, 5)
+	section("## Packages without tests\n\n", a.NoTestPkgs, -1)
+
+	return out.String()
+}
+
+// findTODOs returns every line containing TODO, FIXME, HACK, or XXX in the Go
+// sources under repoPath/cmd and repoPath/internal, in grep's
+// "file:line:content" form, with the repository prefix stripped from the path
+// where it is present. It returns nil when grep produces no output.
+func findTODOs(repoPath string) []string {
+	// Only stdout is captured so grep's diagnostics never end up among the
+	// results. grep exits 1 when nothing matches and 2 when, for example, one
+	// of the two directories does not exist; in the latter case it may still
+	// have printed matches from the other directory, so a non-zero exit is
+	// only treated as "no results" when there is nothing to parse.
+	out, err := exec.Command("grep", "-rn", "--include=*.go",
+		"TODO\\|FIXME\\|HACK\\|XXX",
+		filepath.Join(repoPath, "cmd"),
+		filepath.Join(repoPath, "internal"),
+	).Output()
+	if err != nil && len(out) == 0 {
+		return nil
+	}
+
+	// filepath.Join cleans the paths handed to grep, so the prefix has to be
+	// built from the cleaned root as well; otherwise a repoPath with a
+	// trailing slash would never match.
+	prefix := filepath.Clean(repoPath) + string(filepath.Separator)
+
+	var results []string
+	for _, line := range strings.Split(strings.TrimSpace(string(out)), "\n") {
+		if line == "" {
+			continue
+		}
+		results = append(results, strings.TrimPrefix(line, prefix))
+	}
+	return results
+}
+
+// findHotspots returns up to ten of the most frequently changed files in the
+// last 50 commits of the repository at repoPath, each formatted as
+// "path (changed Nx)". Files ending in _test.go are ignored. Entries are
+// ordered by descending change count, with ties broken by path so the result
+// is deterministic. It returns nil when git fails.
+func findHotspots(repoPath string) []string {
+	// Output captures stdout only, so warnings git prints on stderr are not
+	// mistaken for file names.
+	out, err := exec.Command("git", "-C", repoPath, "log", "--pretty=format:",
+		"--name-only", "-50").Output()
+	if err != nil {
+		return nil
+	}
+
+	counts := map[string]int{}
+	for _, line := range strings.Split(string(out), "\n") {
+		line = strings.TrimSpace(line)
+		if line == "" || strings.HasSuffix(line, "_test.go") {
+			continue
+		}
+		counts[line]++
+	}
+
+	type entry struct {
+		name  string
+		count int
+	}
+	entries := make([]entry, 0, len(counts))
+	for name, count := range counts {
+		entries = append(entries, entry{name, count})
+	}
+	// Map iteration order is random; the name tie-break keeps equal counts
+	// in a stable order from run to run.
+	sort.Slice(entries, func(i, j int) bool {
+		if entries[i].count != entries[j].count {
+			return entries[i].count > entries[j].count
+		}
+		return entries[i].name < entries[j].name
+	})
+
+	limit := 10
+	if len(entries) < limit {
+		limit = len(entries)
+	}
+	var results []string
+	for _, e := range entries[:limit] {
+		// strconv.Itoa formats any count; adding the count to '0' is only
+		// correct for a single digit and a file can change up to 50 times.
+		results = append(results, e.name+" (changed "+strconv.Itoa(e.count)+"x)")
+	}
+	return results
+}
+
+// findNoTestPackages returns the import paths of the packages under repoPath
+// that have neither in-package tests (TestGoFiles) nor external _test-package
+// tests (XTestGoFiles). Packages with a "vendor" path element are skipped.
+// It returns nil when `go list` fails.
+func findNoTestPackages(repoPath string) []string {
+	// A single `go list` prints the import path only for packages whose two
+	// test-file lists are both empty; this replaces one extra process per
+	// package. Dir makes "./..." resolve against repoPath instead of the
+	// process's working directory.
+	cmd := exec.Command("go", "list", "-f",
+		"{{if not (or .TestGoFiles .XTestGoFiles)}}{{.ImportPath}}{{end}}",
+		"./...")
+	cmd.Dir = repoPath
+	out, err := cmd.Output()
+	if err != nil {
+		return nil
+	}
+
+	var noTest []string
+	for _, pkg := range strings.Split(string(out), "\n") {
+		pkg = strings.TrimSpace(pkg)
+		if pkg == "" {
+			continue
+		}
+		// Match "vendor" as a whole path element so that packages which
+		// merely contain the word (e.g. ".../vendors") are still reported.
+		if strings.Contains("/"+pkg+"/", "/vendor/") {
+			continue
+		}
+		noTest = append(noTest, pkg)
+	}
+	return noTest
+}
@@ -365,3 +365,30 @@ func (e *Engine) handlePRReviewAndMerge(ctx context.Context, p iteragent.Provide
 
 	_ = e.switchToMain(ctx)
 }
+
+// auditLog appends one JSON line describing a tool call or tool error to
+// .iterate/audit.jsonl under the engine's repository path.
+//
+// Each record carries a UTC RFC 3339 timestamp ("ts"), the event type
+// ("type") and the tool name ("tool"). A non-empty detail is stored under
+// "detail"; details longer than 200 bytes are cut to at most 200 bytes and
+// suffixed with "...". Logging is best-effort: if the record cannot be
+// encoded or the file cannot be created or opened, the record is dropped.
+func (e *Engine) auditLog(eventType, tool, detail string) {
+	const maxDetail = 200
+
+	entry := map[string]string{
+		"ts":   time.Now().UTC().Format(time.RFC3339),
+		"type": eventType,
+		"tool": tool,
+	}
+	if detail != "" {
+		if len(detail) > maxDetail {
+			// Cut on a rune boundary: slicing through a multi-byte
+			// character leaves invalid UTF-8, which json.Marshal would
+			// rewrite as U+FFFD. Ranging over a string yields the byte
+			// offset of each rune start.
+			cut := 0
+			for i := range detail {
+				if i > maxDetail {
+					break
+				}
+				cut = i
+			}
+			detail = detail[:cut] + "..."
+		}
+		entry["detail"] = detail
+	}
+
+	data, err := json.Marshal(entry)
+	if err != nil {
+		return
+	}
+
+	auditPath := filepath.Join(e.repoPath, ".iterate", "audit.jsonl")
+	if err := os.MkdirAll(filepath.Dir(auditPath), 0o755); err != nil {
+		return
+	}
+	f, err := os.OpenFile(auditPath, os.O_APPEND|os.O_CREATE|os.O_WRONLY, 0o644)
+	if err != nil {
+		return
+	}
+	defer f.Close()
+	// Best-effort: a failed write must not disturb the tool call being audited.
+	_, _ = f.Write(append(data, '\n'))
+}
@@ -19,7 +19,15 @@ func (e *Engine) runTool(ctx context.Context, name string, args map[string]strin
 	if !ok {
 		return "", fmt.Errorf("tool %q not found", name)
 	}
-	return tool.Execute(ctx, args)
+
+	// Audit log
+	e.auditLog("tool_call", name, args["cmd"])
+
+	result, err := tool.Execute(ctx, args)
+	if err != nil {
+		e.auditLog("tool_error", name, err.Error())
+	}
+	return result, err
 }
 
 func (e *Engine) hasChanges(ctx context.Context) (bool, error) {
 
@@ -34,9 +34,11 @@ func initGitRepo(t *testing.T, dir string) {
 			t.Fatalf("%v failed: %v\n%s", c.args, err, out)
 		}
 	}
+	// Add .gitignore to exclude .iterate/ directory
+	os.WriteFile(filepath.Join(dir, ".gitignore"), []byte(".iterate/\n"), 0o644)
 	// initial commit so HEAD exists
 	os.WriteFile(filepath.Join(dir, "README.md"), []byte("# test\n"), 0o644)
-	cmd := exec.Command("git", "add", "README.md")
+	cmd := exec.Command("git", "add", "README.md", ".gitignore")
 	cmd.Dir = dir
 	cmd.CombinedOutput()
 	cmd = exec.Command("git", "commit", "-m", "init")
@@ -725,8 +727,8 @@ func TestHasChanges_WithIgnoredFiles(t *testing.T) {
 	dir := t.TempDir()
 	initGitRepo(t, dir)
 
-	// Create .gitignore
-	os.WriteFile(filepath.Join(dir, ".gitignore"), []byte("*.tmp\n"), 0o644)
+	// Create .gitignore with both patterns
+	os.WriteFile(filepath.Join(dir, ".gitignore"), []byte("*.tmp\n.iterate/\n"), 0o644)
 	cmd := exec.Command("git", "add", ".gitignore")
 	cmd.Dir = dir
 	cmd.CombinedOutput()
 
@@ -69,8 +69,14 @@ func buildPlanPrompt(repoPath, journal, day, issues string) string {
 	learnings, _ := os.ReadFile(filepath.Join(repoPath, "memory", "ACTIVE_LEARNINGS.md"))
 	ciStatus, _ := os.ReadFile(filepath.Join(repoPath, ".iterate", "ci_status.txt"))
 
+	// Run codebase analysis for smarter task selection
+	analysis := AnalyzeCodebase(repoPath)
+	analysisStr := analysis.FormatAnalysis()
+
 	var sb strings.Builder
 	appendPlanInstructions(&sb, ciStatus, day)
+	sb.WriteString("## Codebase Analysis\n\n")
+	sb.WriteString(analysisStr)
 	appendPlanContext(&sb, learnings, journal, issues)
 	return sb.String()
 }
@@ -165,9 +171,30 @@ func (e *Engine) RunImplementPhase(ctx context.Context, p iteragent.Provider) er
 	return nil
 }
 
-// executeTask runs a single task, reverts on failure.
+// executeTask runs a single task via runTaskAttempt. If the first attempt
+// reports failure, it makes exactly one more attempt with a short description
+// of the failure added to the prompt; a second failure is logged and the task
+// is skipped.
 func (e *Engine) executeTask(ctx context.Context, p iteragent.Provider, task planTask, systemPrompt string, tools []iteragent.Tool, skills *iteragent.SkillSet, protectedWarning string) {
-	userMsg := fmt.Sprintf("Implement Task %d: %s\n\n%s\n\nAfter implementing, run: go build ./... && go test ./...\nThen commit your changes.", task.Number, task.Description, protectedWarning)
+	if ok := e.runTaskAttempt(ctx, p, task, systemPrompt, tools, skills, protectedWarning, ""); ok {
+		return
+	}
+
+	// First attempt failed. Retry with error context.
+	e.logger.Info("retrying task after failure", "number", task.Number)
+	// NOTE(review): the failure paths of runTaskAttempt visible in this change
+	// all call e.revert before returning false, so this verify appears to run
+	// against the reverted tree rather than the failed attempt, and the retry
+	// prompt may report "Build passed: true, Test passed: true". Confirm, and
+	// consider handing the failed attempt's own result to the retry instead.
+	v := e.verify(ctx)
+	errorCtx := fmt.Sprintf("Previous attempt failed. Build passed: %v, Test passed: %v. Fix the errors and try again.", v.BuildPassed, v.TestPassed)
+	if ok := e.runTaskAttempt(ctx, p, task, systemPrompt, tools, skills, protectedWarning, errorCtx); ok {
+		e.logger.Info("task succeeded on retry", "number", task.Number)
+	} else {
+		e.logger.Warn("task failed after retry, skipping", "number", task.Number)
+	}
+}
+
+// runTaskAttempt executes one attempt at a task. Returns true on success.
+func (e *Engine) runTaskAttempt(ctx context.Context, p iteragent.Provider, task planTask, systemPrompt string, tools []iteragent.Tool, skills *iteragent.SkillSet, protectedWarning, extraContext string) bool {
+	userMsg := fmt.Sprintf("Implement Task %d: %s\n\n%s", task.Number, task.Description, protectedWarning)
+	if extraContext != "" {
+		userMsg += "\n\n" + extraContext
+	}
+	userMsg += "\n\nAfter implementing, run: go build ./... && go test ./...\nThen commit your changes."
 
 	a := e.newAgent(p, tools, systemPrompt, skills)
 	var taskOutput string
@@ -183,26 +210,26 @@ func (e *Engine) executeTask(ctx context.Context, p iteragent.Provider, task pla
 	a.Finish()
 
 	if taskErr != nil {
-		e.logger.Warn("task failed, reverting", "number", task.Number, "err", taskErr)
+		e.logger.Warn("task error", "number", task.Number, "err", taskErr)
 		_ = e.revert(ctx)
-		return
+		return false
 	}
 
 	if violations, _ := e.verifyProtected(ctx); len(violations) > 0 {
 		e.logger.Warn("protected files modified, reverting", "number", task.Number, "files", violations)
 		_ = e.revert(ctx)
-		return
+		return false
 	}
 
 	v := e.verify(ctx)
 	if !v.BuildPassed || !v.TestPassed {
 		e.logger.Warn("verification failed, reverting", "number", task.Number, "build", v.BuildPassed, "test", v.TestPassed)
 		_ = e.revert(ctx)
-		return
+		return false
 	}
 
 	_ = e.appendLearningJSONL(firstLine(extractCommitMessage(taskOutput)), "evolution", task.Description, "")
-	_ = taskOutput
+	return true
 }
 
 // loadImplementContext prepares system prompt, tools, and skills for implementation.
 
@@ -18,32 +18,43 @@ func buildSystemPrompt(repoPath, identity string) string {
 ## Personality
 %s
 
-## Tool call format
+## Available Tools
 
-To call a tool, output a fenced code block with language "tool":
+You have these tools. USE THEM. Do not just describe what you would do — actually do it.
 
+### read_file — Read a file
 `+"```"+`tool
-{"tool":"tool_name","args":{"key":"value"}}
+{"tool":"read_file","args":{"path":"path/to/file.go"}}
 `+"```"+`
 
-Examples:
-
-Read a file:
+### write_file — Write/create a file
 `+"```"+`tool
-{"tool":"read_file","args":{"path":"internal/evolution/engine.go"}}
+{"tool":"write_file","args":{"path":"SESSION_PLAN.md","content":"## Session Plan\n\nSession Title: My task\n\n### Task 1: Do something\nFiles: cmd/foo.go\nDescription: Fix the thing\nIssue: none\n\n### Issue Responses\n"}}
 `+"```"+`
 
-Write a file:
+### edit_file — Edit part of a file
 `+"```"+`tool
-{"tool":"write_file","args":{"path":"SESSION_PLAN.md","content":"## Session Plan\n\nSession Title: Fix nil pointer\n\n### Task 1: Fix nil check\nFiles: cmd/iterate/repl.go\nDescription: Add nil check on line 47\nIssue: none\n\n### Issue Responses\n"}}
+{"tool":"edit_file","args":{"path":"cmd/foo.go","old_string":"old code here","new_string":"new code here"}}
 `+"```"+`
 
-Run a bash command:
+### bash — Run a shell command
 `+"```"+`tool
 {"tool":"bash","args":{"cmd":"go test ./..."}}
 `+"```"+`
 
-	CRITICAL: You MUST use this format to call tools. Do NOT just describe what you would do.`,
+### list_files — List files in a directory
+`+"```"+`tool
+{"tool":"list_files","args":{"path":"cmd/iterate"}}
+`+"```"+`
+
+## Rules
+
+1. ALWAYS use tools to read files before editing them
+2. After writing code, ALWAYS run: go build ./... && go test ./...
+3. If tests fail, fix the code and try again
+4. If you need to create SESSION_PLAN.md, use write_file
+5. Be direct. No explanations. Just act.
+6. One tool call at a time. Wait for results before next action.`,
 		identity,
 		string(personality),
 	)
@@ -55,6 +66,7 @@ func buildUserMessage(repoPath, journal, issues string) string {
 	var sb strings.Builder
 	sb.WriteString("## Your task\n\n")
 	sb.WriteString("Assess your codebase, find one meaningful improvement, implement it, test it, and commit it.\n\n")
+	sb.WriteString("Start by listing files with list_files, then read the source code.\n\n")
 
 	if len(learnings) > 0 {
 		l := string(learnings)
@@ -79,6 +91,6 @@ func buildUserMessage(repoPath, journal, issues string) string {
 		sb.WriteString(issues + "\n")
 	}
 
-	sb.WriteString("Begin your self-assessment now.")
+	sb.WriteString("Begin now. Use tools. Don't just describe — act.")
 	return sb.String()
 }