code
diff --git a/‎package-lock.json‎
Lines changed: 5 additions & 4 deletions b/‎package-lock.json‎
Lines changed: 5 additions & 4 deletions
diff --git a/‎package.json‎
Lines changed: 2 additions & 1 deletion b/‎package.json‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎src/agent/agentContext.test.ts‎
Lines changed: 5 additions & 5 deletions b/‎src/agent/agentContext.test.ts‎
Lines changed: 5 additions & 5 deletions
diff --git a/‎src/agent/autonomous/agentCompletion.ts‎
Lines changed: 3 additions & 4 deletions b/‎src/agent/autonomous/agentCompletion.ts‎
Lines changed: 3 additions & 4 deletions
diff --git a/‎src/agent/autonomous/autonomousAgentRunner.ts‎
Lines changed: 1 addition & 5 deletions b/‎src/agent/autonomous/autonomousAgentRunner.ts‎
Lines changed: 1 addition & 5 deletions
diff --git a/‎src/cli/cli.ts‎
Lines changed: 4 additions & 2 deletions b/‎src/cli/cli.ts‎
Lines changed: 4 additions & 2 deletions
diff --git a/‎src/cli/gen.ts‎
Lines changed: 5 additions & 3 deletions b/‎src/cli/gen.ts‎
Lines changed: 5 additions & 3 deletions
diff --git a/‎src/functions/scm/git.ts‎
Lines changed: 1 addition & 1 deletion b/‎src/functions/scm/git.ts‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎src/llm/multi-agent/blackberry.ts‎
Lines changed: 2 additions & 2 deletions b/‎src/llm/multi-agent/blackberry.ts‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎src/llm/multi-agent/reasoning-debate.ts‎
Lines changed: 7 additions & 7 deletions b/‎src/llm/multi-agent/reasoning-debate.ts‎
Lines changed: 7 additions & 7 deletions
@@ -49,6 +49,7 @@
     "test:postgres": " node --env-file=variables/test.env ./node_modules/mocha/bin/mocha -r esbuild-register -r \"./src/test/testSetup.ts\" \"src/modules/postgres/*.test.ts\" --timeout 10000",
     "test:mongo": "    node --env-file=variables/test.env ./node_modules/mocha/bin/mocha -r esbuild-register -r \"./src/test/testSetup.ts\" \"src/modules/mongo/*.test.ts\" --timeout 10000",
     "test:db": "       node --env-file=variables/test.env ./node_modules/mocha/bin/mocha -r esbuild-register -r \"./src/test/testSetup.ts\" \"src/modules/{firestore,mongo,postgres}/*.test.ts\" --timeout 10000",
+    "test:single": "   node --env-file=variables/test.env ./node_modules/mocha/bin/mocha -r esbuild-register -r \"./src/test/testSetup.ts\" --timeout 10000 --exit",
     "test:ci:firestore": "firebase emulators:exec --only firestore \"npm run test:firestore\"",
     "test:ci:postgres": " npm run test:postgres",
     "test:ci:mongo": "    npm run test:mongo",
@@ -99,7 +100,7 @@
     "@grpc/grpc-js": "^1.12.6",
     "@microsoft/tiktokenizer": "^1.0.8",
     "@mistralai/mistralai": "^1.7.1",
-    "@modelcontextprotocol/sdk": "^1.13.2",
+    "@modelcontextprotocol/sdk": "^1.17.1",
     "@mozilla/readability": "^0.6.0",
     "@octokit/request": "^5.1.0",
     "@openrouter/ai-sdk-provider": "^0.4.5",
 
@@ -6,7 +6,7 @@ import { deserializeContext, serializeContext } from '#agent/agentSerialization'
 import type { RunAgentConfig } from '#agent/autonomous/autonomousAgentRunner';
 import { appContext } from '#app/applicationContext';
 import { LlmTools } from '#functions/llmTools';
-import { openaiGPT41 } from '#llm/services/openai';
+import { openaiGPT5 } from '#llm/services/openai';
 import type { AgentContext } from '#shared/agent/agent.model';
 import { functionRegistry } from '../functionRegistry';
 
@@ -19,10 +19,10 @@ describe('agentContext', () => {
 	describe('serialisation', () => {
 		it('should be be identical after serialisation and deserialization', async () => {
 			const llms = {
-				easy: openaiGPT41(),
-				medium: openaiGPT41(),
-				hard: openaiGPT41(),
-				xhard: openaiGPT41(),
+				easy: openaiGPT5(),
+				medium: openaiGPT5(),
+				hard: openaiGPT5(),
+				xhard: openaiGPT5(),
 			};
 			// We want to check that the FileSystem gets re-added by the resetFileSystemFunction function
 			const functions = new LlmFunctionsImpl(LlmTools); // FileSystemRead
 
@@ -4,15 +4,14 @@ import type { FunctionCallResult } from '#shared/llm/llm.model';
 import { envVar } from '#utils/env-var';
 
 /**
- * Runs the completionHandler on an agent
- * @param agent
+ * Executes the completion handler for a given agent. If the handler throws, the error is logged and not rethrown.
+ * @param agent - The agent context containing the completion handler to be invoked.
  */
 export async function runAgentCompleteHandler(agent: AgentContext): Promise<void> {
 	try {
 		await agent.completedHandler?.notifyCompleted(agent);
 	} catch (e) {
-		logger.warn(e, `Completion handler error for agent ${agent.agentId}`);
-		throw e;
+		logger.error(e, `Completion handler error for agent ${agent.agentId}`);
 	}
 }
 
 
@@ -383,10 +383,6 @@ async function checkRepoHomeAndWorkingDirectory(agent: AgentContext) {
 		agent.typedAiRepoDir = currentRepoDir;
 	}
 	const workingDir = fss.getWorkingDirectory();
-	logger.info({ workingDir }, 'Verifying working directory exists');
 	const workDirExists = await fss.directoryExists(workingDir);
-	if (!workDirExists) {
-		throw new Error(`Working directory ${workingDir} does not exist or is not a directory.`);
-	}
-	logger.info({ workingDir }, 'Working directory verified.');
+	if (!workDirExists) throw new Error(`Working directory ${workingDir} does not exist or is not a directory.`);
 }
@@ -6,7 +6,7 @@ import { MAD_Balanced, MAD_Fast, MAD_SOTA } from '#llm/multi-agent/reasoning-deb
 import { Claude4_1_Opus_Vertex } from '#llm/services/anthropic-vertex';
 import { cerebrasQwen3_235b_Thinking, cerebrasQwen3_Coder } from '#llm/services/cerebras';
 import { defaultLLMs } from '#llm/services/defaultLlms';
-import { openAIo3 } from '#llm/services/openai';
+import { openaiGPT5, openaiGPT5mini, openaiGPT5nano } from '#llm/services/openai';
 import { perplexityDeepResearchLLM, perplexityLLM, perplexityReasoningProLLM } from '#llm/services/perplexity-llm';
 import { xai_Grok4 } from '#llm/services/xai';
 import { logger } from '#o11y/logger';
@@ -21,7 +21,9 @@ export const LLM_CLI_ALIAS: Record<string, () => LLM> = {
 	f: cerebrasQwen3_235b_Thinking,
 	cc: cerebrasQwen3_Coder,
 	x: xai_Grok4,
-	o3: openAIo3,
+	g5: openaiGPT5,
+	g5m: openaiGPT5mini,
+	g5n: openaiGPT5nano,
 	madb: MAD_Balanced,
 	mads: MAD_SOTA,
 	madf: MAD_Fast,
 
@@ -1,7 +1,7 @@
 import '#fastify/trace-init/trace-init'; // leave an empty line next so this doesn't get sorted from the first line
 
 import { writeFileSync } from 'node:fs';
-import { initInMemoryApplicationContext } from '#app/applicationContext';
+import { initApplicationContext, initInMemoryApplicationContext } from '#app/applicationContext';
 import { ReasonerDebateLLM } from '#llm/multi-agent/reasoning-debate';
 import { defaultLLMs } from '#llm/services/defaultLlms';
 import { countTokens } from '#llm/tokens';
@@ -13,11 +13,13 @@ import { parsePromptWithImages } from './promptParser';
 // npm run gen
 
 async function main() {
-	await initInMemoryApplicationContext();
-
 	const { initialPrompt: rawPrompt, llmId, flags } = parseProcessArgs();
 	const { textPrompt, userContent } = parsePromptWithImages(rawPrompt);
 
+	// -s save to database
+	if (flags.s) await initApplicationContext();
+	else await initInMemoryApplicationContext();
+
 	let llm: LLM = defaultLLMs().medium;
 	if (llmId) {
 		if (!LLM_CLI_ALIAS[llmId]) {
 
@@ -74,7 +74,7 @@ export class Git implements VersionControlSystem {
 
 		// The fix is to execute a specific commit command that targets only the added files.
 		const commitResult = await execCommand(`git commit -m ${arg(commitMessage)} -- ${filesToAdd}`);
-		// Pre-commit hooks make call lint/commit commands with
+		// Pre-commit hooks may call lint/commit commands whose output contains ANSI colour characters etc
 		commitResult.stdout = formatAnsiWithMarkdownLinks(commitResult.stdout);
 		failOnError(`Failed to commit changes for files: ${files.join(', ')}`, commitResult);
 	}
 
@@ -1,7 +1,7 @@
 import { BaseLLM } from '#llm/base-llm';
 import { Claude4_Sonnet_Vertex } from '#llm/services/anthropic-vertex';
 import { fireworksLlama3_405B } from '#llm/services/fireworks';
-import { openaiGPT41 } from '#llm/services/openai';
+import { openaiGPT5 } from '#llm/services/openai';
 import { logger } from '#o11y/logger';
 import type { GenerateTextOptions, LLM } from '#shared/llm/llm.model';
 
@@ -65,7 +65,7 @@ const MIND_OVER_DATA_SYS_PROMPT = `When addressing a problem, employ "Comparativ
 `;
 
 export class Blackberry extends BaseLLM {
-	llms: LLM[] = [Claude4_Sonnet_Vertex(), openaiGPT41(), Claude4_Sonnet_Vertex()];
+	llms: LLM[] = [Claude4_Sonnet_Vertex(), openaiGPT5(), Claude4_Sonnet_Vertex()];
 	mediator: LLM = Claude4_Sonnet_Vertex();
 
 	constructor() {
 
@@ -4,7 +4,7 @@ import { FastMediumLLM } from '#llm/multi-agent/fastMedium';
 import { anthropicClaude4_Sonnet } from '#llm/services/anthropic';
 import { Claude4_1_Opus_Vertex, Claude4_Sonnet_Vertex } from '#llm/services/anthropic-vertex';
 import { deepinfraDeepSeekR1 } from '#llm/services/deepinfra';
-import { openAIo3 } from '#llm/services/openai';
+import { openaiGPT5 } from '#llm/services/openai';
 import { vertexGemini_2_5_Pro } from '#llm/services/vertexai';
 import { xai_Grok4 } from '#llm/services/xai';
 import { logger } from '#o11y/logger';
@@ -83,7 +83,7 @@ export function MAD_Balanced(): LLM {
 	return new ReasonerDebateLLM(
 		'Balanced',
 		vertexGemini_2_5_Pro,
-		[vertexGemini_2_5_Pro, xai_Grok4, openAIo3],
+		[vertexGemini_2_5_Pro, xai_Grok4, openaiGPT5],
 		'MAD:Balanced multi-agent debate (Gemini 2.5 Pro, Grok 4, o3)',
 	);
 }
@@ -92,7 +92,7 @@ export function MAD_Balanced4(): LLM {
 	return new ReasonerDebateLLM(
 		'Balanced4',
 		vertexGemini_2_5_Pro,
-		[vertexGemini_2_5_Pro, xai_Grok4, openAIo3, Claude4_Sonnet_Vertex],
+		[vertexGemini_2_5_Pro, xai_Grok4, openaiGPT5, Claude4_Sonnet_Vertex],
 		'MAD:Balanced multi-agent debate (Gemini 2.5 Pro, Grok 4, o3, Sonnet 4)',
 	);
 }
@@ -116,7 +116,7 @@ export function MAD_Anthropic(): LLM {
 }
 
 export function MAD_OpenAI(): LLM {
-	return new ReasonerDebateLLM('OpenAI', openAIo3, [openAIo3, openAIo3, openAIo3], 'MAD:OpenAI multi-agent debate (o3 x3)');
+	return new ReasonerDebateLLM('OpenAI', openaiGPT5, [openaiGPT5, openaiGPT5, openaiGPT5], 'MAD:OpenAI multi-agent debate (GPT5 x3)');
 }
 
 export function MAD_Grok(): LLM {
@@ -126,9 +126,9 @@ export function MAD_Grok(): LLM {
 export function MAD_SOTA(): LLM {
 	return new ReasonerDebateLLM(
 		'SOTA',
-		xai_Grok4,
-		[openAIo3, Claude4_1_Opus_Vertex, vertexGemini_2_5_Pro, xai_Grok4],
-		'MAD:SOTA multi-agent debate (Opus 4, o3, Gemini 2.5 Pro, Grok 4)',
+		openaiGPT5,
+		[openaiGPT5, Claude4_1_Opus_Vertex, vertexGemini_2_5_Pro, xai_Grok4],
+		'MAD:SOTA multi-agent debate (Opus 4, GPT5, Gemini 2.5 Pro, Grok 4)',
 	);
 }
Original file line number	Diff line number	Diff line change
`@@ -383,10 +383,6 @@ async function checkRepoHomeAndWorkingDirectory(agent: AgentContext) {`
`383`	`383`	`agent.typedAiRepoDir = currentRepoDir;`
`384`	`384`	`}`
`385`	`385`	`const workingDir = fss.getWorkingDirectory();`
`386`		`- logger.info({ workingDir }, 'Verifying working directory exists');`
`387`	`386`	`const workDirExists = await fss.directoryExists(workingDir);`
`388`		`- if (!workDirExists) {`
`389`		- throw new Error(`Working directory ${workingDir} does not exist or is not a directory.`);
`390`		`- }`
`391`		`- logger.info({ workingDir }, 'Working directory verified.');`
	`387`	+ if (!workDirExists) throw new Error(`Working directory ${workingDir} does not exist or is not a directory.`);
`392`	`388`	`}`
Original file line number	Diff line number	Diff line change
`@@ -74,7 +74,7 @@ export class Git implements VersionControlSystem {`
`74`	`74`
`75`	`75`	`// The fix is to execute a specific commit command that targets only the added files.`
`76`	`76`	const commitResult = await execCommand(`git commit -m ${arg(commitMessage)} -- ${filesToAdd}`);
`77`		`- // Pre-commit hooks make call lint/commit commands with`
	`77`	`+ // Pre-commit hooks may call lint/commit commands whose output contains ANSI colour characters etc`
`78`	`78`	`commitResult.stdout = formatAnsiWithMarkdownLinks(commitResult.stdout);`
`79`	`79`	failOnError(`Failed to commit changes for files: ${files.join(', ')}`, commitResult);
`80`	`80`	`}`