Prompt refactor for planner agent (ml-commons)

yyfamazon · yyfamazon · commit d4d3ac983cb8 · 2026-05-27T18:21:38.000+08:00
Signed-off-by: yyfamazon <yyf@amazon.com>
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/MLPlanExecuteAndReflectAgentRunner.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/MLPlanExecuteAndReflectAgentRunner.java
@@ -34,14 +34,15 @@
 import static org.opensearch.ml.engine.algorithms.agent.MLChatAgentRunner.saveTraceData;
 import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.DEFAULT_PLANNER_PROMPT;
 import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.DEFAULT_PLANNER_PROMPT_TEMPLATE;
+import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.DEFAULT_PLANNER_SYSTEM_PROMPT_PREFIX;
 import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.DEFAULT_PLANNER_WITH_HISTORY_PROMPT_TEMPLATE;
 import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.DEFAULT_REFLECT_PROMPT;
 import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.DEFAULT_REFLECT_PROMPT_TEMPLATE;
 import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.EXECUTOR_RESPONSIBILITY;
 import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.FINAL_RESULT_RESPONSE_INSTRUCTIONS;
 import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.MAX_STEP_SUMMARY_PER_SYSTEM_PROMPT;
-import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.PLANNER_RESPONSIBILITY;
-import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.PLAN_EXECUTE_REFLECT_RESPONSE_FORMAT;
+import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.getCorePlanningInstructions;
+import static org.opensearch.ml.engine.algorithms.agent.PromptTemplate.getPlanExecuteReflectResponseFormat;
 
 import java.util.ArrayList;
 import java.util.HashMap;
@@ -120,8 +121,8 @@ public class MLPlanExecuteAndReflectAgentRunner implements MLAgentRunner {
     private String plannerWithHistoryPromptTemplate;
 
     @VisibleForTesting
-    static final String DEFAULT_PLANNER_SYSTEM_PROMPT = PLANNER_RESPONSIBILITY + PLAN_EXECUTE_REFLECT_RESPONSE_FORMAT
-        + FINAL_RESULT_RESPONSE_INSTRUCTIONS;
+    static final String DEFAULT_PLANNER_SYSTEM_PROMPT = DEFAULT_PLANNER_SYSTEM_PROMPT_PREFIX + getCorePlanningInstructions()
+        + getPlanExecuteReflectResponseFormat() + FINAL_RESULT_RESPONSE_INSTRUCTIONS; // default planner system prompt: prefix, core planning instructions, default response format, then final-result instructions
 
     @VisibleForTesting
     static final String DEFAULT_EXECUTOR_SYSTEM_PROMPT = EXECUTOR_RESPONSIBILITY;
@@ -141,6 +142,9 @@ public class MLPlanExecuteAndReflectAgentRunner implements MLAgentRunner {
     public static final String PLAN_EXECUTE_REFLECT_RESPONSE_FORMAT_FIELD = "plan_execute_reflect_response_format";
     public static final String PROMPT_TEMPLATE_FIELD = "prompt_template";
     public static final String SYSTEM_PROMPT_FIELD = "system_prompt";
+    public static final String RESULT_EXPAND_OVERRIDE = "result_expand_and_override"; // parameter key; setupPromptParameters passes its value as the first argument of getPlanExecuteReflectResponseFormat
+    public static final String IMPORTANT_RULES_EXPAND = "important_rules_expand"; // parameter key; setupPromptParameters passes its value as the second argument of getPlanExecuteReflectResponseFormat
+    public static final String PLANNER_SYSTEM_PROMPT_PREFIX = "planner_system_prompt_prefix"; // parameter key for a custom prompt prefix; setupPromptParameters falls back to DEFAULT_PLANNER_SYSTEM_PROMPT_PREFIX when it is absent
     public static final String QUESTION_FIELD = "question";
     public static final String MEMORY_ID_FIELD = "memory_id";
     public static final String PARENT_INTERACTION_ID_FIELD = "parent_interaction_id";
@@ -199,23 +203,38 @@ public MLPlanExecuteAndReflectAgentRunner(
     }
 
     @VisibleForTesting
-    void setupPromptParameters(Map<String, String> params) {
+    void setupPromptParameters(Map<String, String> params, boolean injectDate, String currentDateTime) {
         // populated depending on whether LLM is asked to plan or re-evaluate
         // removed here, so that error is thrown in case this field is not populated
         params.remove(PROMPT_FIELD);
 
         String userPrompt = params.get(QUESTION_FIELD);
         params.put(USER_PROMPT_FIELD, userPrompt);
 
-        boolean injectDate = Boolean.parseBoolean(params.getOrDefault(INJECT_DATETIME_FIELD, "false"));
-        String dateFormat = params.get(DATETIME_FORMAT_FIELD);
-        String currentDateTime = injectDate ? getCurrentDateTime(dateFormat) : "";
+        String clientBusinessPrompt = params.get(SYSTEM_PROMPT_FIELD);
 
-        String plannerSystemPrompt = params.getOrDefault(SYSTEM_PROMPT_FIELD, DEFAULT_PLANNER_SYSTEM_PROMPT);
-        if (injectDate) {
-            plannerSystemPrompt = String.format("%s\n\n%s", plannerSystemPrompt, currentDateTime);
+        if (clientBusinessPrompt != null && !clientBusinessPrompt.isEmpty()) { // Replace the whole prompt if client specifies system prompt template
+            params.put(SYSTEM_PROMPT_FIELD, clientBusinessPrompt);
+        } else { // Using the default system prompt template if client does not specify.
+            params.put(SYSTEM_PROMPT_FIELD, DEFAULT_PLANNER_SYSTEM_PROMPT);
+        }
+
+        String resultExpandOverride = params.get(RESULT_EXPAND_OVERRIDE);
+        String importantRulesExpand = params.get(IMPORTANT_RULES_EXPAND);
+        String plannerSystemPromptPrefix = params.getOrDefault(PLANNER_SYSTEM_PROMPT_PREFIX, DEFAULT_PLANNER_SYSTEM_PROMPT_PREFIX);
+
+        // Append / mutate the system prompt through these 3 parameters: plannerSystemPromptPrefix, resultExpandOverride and importantRulesExpand
+        if (plannerSystemPromptPrefix != null && !plannerSystemPromptPrefix.isEmpty()
+                && resultExpandOverride != null && !resultExpandOverride.isEmpty()
+                && importantRulesExpand != null && !importantRulesExpand.isEmpty()) {
+            StringBuilder stringBuilder = new StringBuilder();
+            stringBuilder.append(plannerSystemPromptPrefix).append("\n");
+            stringBuilder.append(getCorePlanningInstructions()).append("\n");
+            stringBuilder.append(getPlanExecuteReflectResponseFormat(resultExpandOverride, importantRulesExpand));
+            String finalPlannerPrompt = stringBuilder.toString();
+
+            params.put(SYSTEM_PROMPT_FIELD, finalPlannerPrompt);
         }
-        params.put(SYSTEM_PROMPT_FIELD, plannerSystemPrompt);
 
         String executorSystemPrompt = params.getOrDefault(EXECUTOR_SYSTEM_PROMPT_FIELD, DEFAULT_EXECUTOR_SYSTEM_PROMPT);
         if (injectDate) {
@@ -245,7 +264,7 @@ void setupPromptParameters(Map<String, String> params) {
             this.plannerWithHistoryPromptTemplate = params.get(PLANNER_WITH_HISTORY_TEMPLATE_FIELD);
         }
 
-        params.put(PLAN_EXECUTE_REFLECT_RESPONSE_FORMAT_FIELD, PLAN_EXECUTE_REFLECT_RESPONSE_FORMAT);
+        params.put(PLAN_EXECUTE_REFLECT_RESPONSE_FORMAT_FIELD, getPlanExecuteReflectResponseFormat());
 
         params.put(NO_ESCAPE_PARAMS_FIELD, DEFAULT_NO_ESCAPE_PARAMS);
 
@@ -264,8 +283,12 @@ void setupPromptParameters(Map<String, String> params) {
     }
 
     @VisibleForTesting
-    void usePlannerPromptTemplate(Map<String, String> params) {
-        params.put(PROMPT_TEMPLATE_FIELD, this.plannerPromptTemplate);
+    void usePlannerPromptTemplate(Map<String, String> params, boolean injectDate, String currentDateTime) { // stores the planner prompt template under PROMPT_TEMPLATE_FIELD, then calls populatePrompt(params)
+        String template = this.plannerPromptTemplate;
+        if (injectDate) { // currentDateTime is only read when injectDate is true
+            template = template + "\n\n" + currentDateTime; // date text is appended after the template, separated by a blank line
+        }
+        params.put(PROMPT_TEMPLATE_FIELD, template);
         populatePrompt(params);
     }
 
@@ -297,10 +320,14 @@ public void run(MLAgent mlAgent, Map<String, String> apiParams, ActionListener<O
         allParams.put(TENANT_ID_FIELD, mlAgent.getTenantId());
         log.debug("MLPlanExecuteAndReflectAgentRunner called with allParams: {}", allParams);
 
-        setupPromptParameters(allParams);
+        boolean injectDate = Boolean.parseBoolean(allParams.getOrDefault(INJECT_DATETIME_FIELD, "false"));
+        String dateFormat = allParams.get(DATETIME_FORMAT_FIELD);
+        String currentDateTime = injectDate ? getCurrentDateTime(dateFormat) : "";
+
+        setupPromptParameters(allParams, injectDate, currentDateTime);
 
         // planner prompt for the first call
-        usePlannerPromptTemplate(allParams);
+        usePlannerPromptTemplate(allParams, injectDate, currentDateTime);
 
         // Token tracking: resolve model metadata, then proceed with memory setup and execution.
         String llmModelId = mlAgent.getLlm().getModelId();
diff --git a/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/PromptTemplate.java b/ml-algorithms/src/main/java/org/opensearch/ml/engine/algorithms/agent/PromptTemplate.java
@@ -81,51 +81,75 @@ public class PromptTemplate {
                 6. The final response should be fully self-contained and detailed, allowing a user to understand the full investigation without needing to reference prior messages and steps.
             """;
 
-    public static final String PLAN_EXECUTE_REFLECT_RESPONSE_FORMAT = "Response Instructions: \n"
-        + "Only respond in JSON format. Always follow the given response instructions. Do not return any content that does not follow the response instructions. Do not add anything before or after the expected JSON. \n"
-        + "Always respond with a valid JSON object that strictly follows the below schema:\n"
-        + "{\n"
-        + "\t\"steps\": array[string], \n"
-        + "\t\"result\": string \n"
-        + "}\n"
-        + "Use \"steps\" to return an array of strings where each string is a step to complete the objective, leave it empty if you know the final result. Please wrap each step in quotes and escape any special characters within the string. \n"
-        + "Use \"result\" return the final response when you have enough information, leave it empty if you want to execute more steps. Please escape any special characters within the result. \n"
-        + "Here are examples of valid responses following the required JSON schema:\n\n"
-        + "Example 1 - When you need to execute steps:\n"
-        + "{\n"
-        + "\t\"steps\": [\"This is an example step\", \"this is another example step\"],\n"
-        + "\t\"result\": \"\"\n"
-        + "}\n\n"
-        + "Example 2 - When you have the final result:\n"
-        + "{\n"
-        + "\t\"steps\": [],\n"
-        + "\t\"result\": \"This is an example result\\n with escaped special characters\"\n"
-        + "}\n"
-        + "Important rules for the response:\n"
-        + "1. Do not use commas within individual steps \n"
-        + "2. Do not add any content before or after the JSON \n"
-        + "3. Only respond with a pure JSON object \n\n";
-
-    public static final String PLANNER_RESPONSIBILITY =
-        """
-            You are a thoughtful and analytical planner agent in a plan-execute-reflect framework. Your job is to design a clear, step-by-step plan for a given objective.
-
-            Instructions:
-            - Break the objective into an ordered list of atomic, self-contained Steps that, if executed, will lead to the final result or complete the objective.
-            - Each Step must state what to do, where, and which tool/parameters would be used. You do not execute tools, only reference them for planning.
-            - Use only the provided tools; do not invent or assume tools. If no suitable tool applies, use reasoning or observations instead.
-            - Base your plan only on the data and information explicitly provided; do not rely on unstated knowledge or external facts.
-            - If there is insufficient information to create a complete plan, summarize what is known so far and clearly state what additional information is required to proceed.
-            - Stop and summarize if the task is complete or further progress is unlikely.
-            - Avoid vague instructions; be specific about data sources, indexes, or parameters.
-            - Never make assumptions or rely on implicit knowledge.
-            - Respond only in JSON format.
-
-            Step examples:
-            Good example: \"Use Tool to sample documents from index: 'my-index'\"
-            Bad example: \"Use Tool to sample documents from each index\"
-            Bad example: \"Use Tool to sample documents from all indices\"
-            """;
+    public static String getPlanExecuteReflectResponseFormat(String resultExpandAndOverride, String importantRulesExpand) { // builds the planner's JSON response-format instructions; either argument may be null
+        String resultExample = "Here are examples of valid responses following the required JSON schema:\n\n" // built-in examples, included in the output only when resultExpandAndOverride is null
+            + "Example 1 - When you need to execute steps:\n"
+            + "{\n"
+            + "\t\"steps\": [\"This is an example step\", \"this is another example step\"],\n"
+            + "\t\"result\": \"\"\n"
+            + "}\n\n"
+            + "Example 2 - When you have the final result:\n"
+            + "{\n"
+            + "\t\"steps\": [],\n"
+            + "\t\"result\": \"This is an example result\\n with escaped special characters\"\n"
+            + "}\n";
+
+        return "# Response Format\n\n"
+            + "## JSON Response Requirements\n"
+            + "Only respond in JSON format. Always follow the given response instructions. Do not return any content that does not follow the response instructions. Do not add anything before or after the expected JSON\n\n"
+            + "Always respond with a valid JSON object that strictly follows the below schema:\n"
+            + "```json\n"
+            + "{\n"
+            + "  \"steps\": array[string],\n"
+            + "  \"result\": string\n"
+            + "}\n"
+            + "```\n"
+            + "\n"
+            + "- Use \"steps\" to return an array of strings where each string is a step to complete the objective, leave it empty if you know the final result. Please wrap each step in quotes and escape any special characters within the string\n"
+            + "- Use \"result\" to return the final response when you have enough information, leave it empty if you want to execute more steps. " // NOTE(review): the removed PLAN_EXECUTE_REFLECT_RESPONSE_FORMAT also asked to escape special characters within the result; confirm dropping that sentence is intended
+            + (resultExpandAndOverride == null ? "" : resultExpandAndOverride) // optional extra guidance appended to the result bullet
+            + "\n"
+            + (resultExpandAndOverride == null ? resultExample : "") // any non-null value, even an empty string, suppresses the built-in examples - NOTE(review): confirm callers never pass an empty string
+            + "## Critical Rules\n"
+            + "1. Do not use commas within individual steps\n"
+            + "2. Do not add any content before or after the JSON\n"
+            + "3. Only respond with a pure JSON object\n"
+            + (importantRulesExpand == null ? "" : importantRulesExpand) // appended verbatim on the line after rule 3; no numbering is added here
+            + "\n";
+    }
+
+    public static String getPlanExecuteReflectResponseFormat() { // default format: no result override and no extra rules, so the built-in examples are included
+        return getPlanExecuteReflectResponseFormat(null, null);
+    }
+
+    public static final String DEFAULT_PLANNER_SYSTEM_PROMPT_PREFIX =
+        "# Investigation Planner Agent\n\nYou are a thoughtful and analytical planner agent in a plan-execute-reflect framework. Your job is to design a clear, step-by-step plan for a given objective.\n\n"; // Markdown heading plus role statement that opens the default planner system prompt
+
+    public static String getCorePlanningInstructions() { // returns the fixed instruction section: core planning rules followed by good/bad step examples
+        return """
+            # Instructions
+
+            ## Core Planning Rules
+            - Break the objective into an ordered list of atomic, self-contained Steps that, if executed, will lead to the final result or complete the objective
+            - Each Step must state what to do, where, and which tool/parameters would be used. You do not execute tools, only reference them for planning
+            - Use only the provided tools; do not invent or assume tools. If no suitable tool applies, use reasoning or observations instead
+            - Base your plan only on the data and information explicitly provided; do not rely on unstated knowledge or external facts
+            - If there is insufficient information to create a complete plan, summarize what is known so far and clearly state what additional information is required to proceed
+            - Stop and summarize if the task is complete or further progress is unlikely
+            - Avoid vague instructions; be specific about data sources, indexes, or parameters
+            - Never make assumptions or rely on implicit knowledge
+            - Respond only in JSON format
+            """
+            + """
+                ## Step Examples
+                **Good example:** "Use Tool to sample documents from index: 'my-index'"
+
+                **Bad example:** "Use Tool to sample documents from each index"
+
+                **Bad example:** "Use Tool to sample documents from all indices"
+
+                """; // the blank line before the closing delimiter is part of the returned text
+    }
 
     public static final String EXECUTOR_RESPONSIBILITY =
         """
diff --git a/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/agent/MLPlanExecuteAndReflectAgentRunnerTest.java b/ml-algorithms/src/test/java/org/opensearch/ml/engine/algorithms/agent/MLPlanExecuteAndReflectAgentRunnerTest.java