Debug Mode

InsightFactoryAPP · InsightFactoryAPP · commit a76ce262ee17 · 2025-09-07T01:22:49.000-04:00
diff --git a/tinyagent/code_agent/providers/base.py b/tinyagent/code_agent/providers/base.py
@@ -73,14 +73,16 @@ def __init__(
     async def execute_python(
         self, 
         code_lines: List[str], 
-        timeout: int = 120
+        timeout: int = 120,
+        debug_mode: bool = False
     ) -> Dict[str, Any]:
         """
         Execute Python code and return the result.
         
         Args:
             code_lines: List of Python code lines to execute
             timeout: Maximum execution time in seconds
+            debug_mode: Whether to print the executed code (useful for debugging)
             
         Returns:
             Dictionary containing execution results with keys:
diff --git a/tinyagent/code_agent/providers/bubblewrap_provider.py b/tinyagent/code_agent/providers/bubblewrap_provider.py
@@ -365,13 +365,14 @@ def _build_bubblewrap_command(
         
         return cmd
     
-    async def execute_python(self, code_lines: List[str], timeout: int = 120) -> Dict[str, Any]:
+    async def execute_python(self, code_lines: List[str], timeout: int = 120, debug_mode: bool = False) -> Dict[str, Any]:
         """
         Execute Python code within a bubblewrap sandbox and return the result.
         
         Args:
             code_lines: List of Python code lines to execute
             timeout: Maximum execution time in seconds
+            debug_mode: Whether to print the executed code and the execution response (useful for debugging)
             
         Returns:
             Dictionary containing execution results
@@ -381,14 +382,16 @@ async def execute_python(self, code_lines: List[str], timeout: int = 120) -> Dic
         
         full_code = "\n".join(code_lines)
         
-        print("#" * 100)
-        print("##########################################code##########################################")
-        print(full_code)
-        print("#" * 100)
+        if debug_mode:
+            print("#" * 100)
+            print("##########################################code##########################################")
+            print(full_code)
+            print("#" * 100)
         
         # Prepare the full code with tools and default codes if needed
         if self.executed_default_codes:
-            print("✔️ default codes already executed")
+            if debug_mode:
+                print("✔️ default codes already executed")
             complete_code = "\n".join(self.code_tools_definitions) + "\n\n" + full_code
         else:
             complete_code = "\n".join(self.code_tools_definitions) + "\n\n" + "\n".join(self.default_python_codes) + "\n\n" + full_code
@@ -687,7 +690,7 @@ def _sanitize_state_dict(d):
                     result["error"] = f"Process exited with code {process.returncode}"
                 
                 # Log the response
-                self._log_response(result)
+                self._log_response(result, debug_mode)
                 
                 return clean_response(result)
             
@@ -724,29 +727,30 @@ def _sanitize_state_dict(d):
             except Exception:
                 pass
     
-    def _log_response(self, response: Dict[str, Any]):
+    def _log_response(self, response: Dict[str, Any], debug_mode: bool = False):
         """Log the response from code execution."""
-        print("######################### BUBBLEWRAP EXECUTION #########################")
-        print("#########################<printed_output>#########################")
-        print(response["printed_output"])
-        print("#########################</printed_output>#########################")
-        if response.get("return_value", None) not in [None, ""]:
-            print("#########################<return_value>#########################")
-            print(response["return_value"])
-            print("#########################</return_value>#########################")
-        if response.get("stderr", None) not in [None, ""]:
-            print("#########################<stderr>#########################")
-            print(response["stderr"])
-            print("#########################</stderr>#########################")
-        if response.get("error_traceback", None) not in [None, ""]:
-            print("#########################<traceback>#########################")
-            # Check if this is a security exception and highlight it in red if so
-            error_text = response["error_traceback"]
-            if "SECURITY" in error_text:
-                print(f"{COLOR['RED']}{error_text}{COLOR['ENDC']}")
-            else:
-                print(error_text)
-            print("#########################</traceback>#########################")
+        if debug_mode:
+            print("######################### BUBBLEWRAP EXECUTION #########################")
+            print("#########################<printed_output>#########################")
+            print(response["printed_output"])
+            print("#########################</printed_output>#########################")
+            if response.get("return_value", None) not in [None, ""]:
+                print("#########################<return_value>#########################")
+                print(response["return_value"])
+                print("#########################</return_value>#########################")
+            if response.get("stderr", None) not in [None, ""]:
+                print("#########################<stderr>#########################")
+                print(response["stderr"])
+                print("#########################</stderr>#########################")
+            if response.get("error_traceback", None) not in [None, ""]:
+                print("#########################<traceback>#########################")
+                # Check if this is a security exception and highlight it in red if so
+                error_text = response["error_traceback"]
+                if "SECURITY" in error_text:
+                    print(f"{COLOR['RED']}{error_text}{COLOR['ENDC']}")
+                else:
+                    print(error_text)
+                print("#########################</traceback>#########################")
     
     def _quote_command_for_shell(self, command: List[str]) -> str:
         """
@@ -862,7 +866,7 @@ async def _prepare_git_sandbox_command(self, command: List[str]) -> List[str]:
 # Check if it's a GitHub URL
 if [[ "$REMOTE_URL" == *"github.com"* ]]; then
     # Extract the repo path from the URL
-    REPO_PATH=$(echo "$REMOTE_URL" | sed -E 's|https://[^/]*github\.com/||' | sed -E 's|git@github\.com:||' | sed 's|\.git$||')
+    REPO_PATH=$(echo "$REMOTE_URL" | sed -E 's|https://[^/]*github\\.com/||' | sed -E 's|git@github\\.com:||' | sed 's|\\.git$||')
     
     # Set the remote URL with the token
     git remote set-url {remote_name} "https://{github_username}:{github_token}@github.com/$REPO_PATH.git"
diff --git a/tinyagent/code_agent/providers/docker_provider.py b/tinyagent/code_agent/providers/docker_provider.py
@@ -548,13 +548,14 @@ def get_environment_variables(self) -> Dict[str, str]:
         """
         return self.environment_variables.copy()
     
-    async def execute_python(self, code_lines: List[str], timeout: int = 120) -> Dict[str, Any]:
+    async def execute_python(self, code_lines: List[str], timeout: int = 120, debug_mode: bool = False) -> Dict[str, Any]:
         """
         Execute Python code within a Docker container and return the result.
         
         Args:
             code_lines: List of Python code lines to execute
             timeout: Maximum execution time in seconds
+            debug_mode: Whether to print the executed code and the execution response (useful for debugging)
             
         Returns:
             Dictionary containing execution results
@@ -564,14 +565,16 @@ async def execute_python(self, code_lines: List[str], timeout: int = 120) -> Dic
         
         full_code = "\n".join(code_lines)
         
-        print("#" * 100)
-        print("##########################################code##########################################")
-        print(full_code)
-        print("#" * 100)
+        if debug_mode:
+            print("#" * 100)
+            print("##########################################code##########################################")
+            print(full_code)
+            print("#" * 100)
         
         # Prepare the full code with tools and default codes if needed
         if self.executed_default_codes:
-            print("✔️ default codes already executed")
+            if debug_mode:
+                print("✔️ default codes already executed")
             complete_code = "\n".join(self.code_tools_definitions) + "\n\n" + full_code
         else:
             complete_code = "\n".join(self.code_tools_definitions) + "\n\n" + "\n".join(self.default_python_codes) + "\n\n" + full_code
@@ -697,7 +700,7 @@ async def execute_python(self, code_lines: List[str], timeout: int = 120) -> Dic
                     result["error"] = f"Process exited with code {process.returncode}"
                 
                 # Log the response
-                self._log_response(result)
+                self._log_response(result, debug_mode)
                 
                 return clean_response(result)
             
@@ -953,29 +956,30 @@ def _sanitize_state_dict(d):
 print(json.dumps(cleaned_result))
 """
     
-    def _log_response(self, response: Dict[str, Any]):
+    def _log_response(self, response: Dict[str, Any], debug_mode: bool = False):
         """Log the response from code execution."""
-        print("######################### DOCKER EXECUTION #########################")
-        print("#########################<printed_output>#########################")
-        print(response["printed_output"])
-        print("#########################</printed_output>#########################")
-        if response.get("return_value", None) not in [None, ""]:
-            print("#########################<return_value>#########################")
-            print(response["return_value"])
-            print("#########################</return_value>#########################")
-        if response.get("stderr", None) not in [None, ""]:
-            print("#########################<stderr>#########################")
-            print(response["stderr"])
-            print("#########################</stderr>#########################")
-        if response.get("error_traceback", None) not in [None, ""]:
-            print("#########################<traceback>#########################")
-            # Check if this is a security exception and highlight it in red if so
-            error_text = response["error_traceback"]
-            if "SECURITY" in error_text:
-                print(f"{COLOR['RED']}{error_text}{COLOR['ENDC']}")
-            else:
-                print(error_text)
-            print("#########################</traceback>#########################")
+        if debug_mode:
+            print("######################### DOCKER EXECUTION #########################")
+            print("#########################<printed_output>#########################")
+            print(response["printed_output"])
+            print("#########################</printed_output>#########################")
+            if response.get("return_value", None) not in [None, ""]:
+                print("#########################<return_value>#########################")
+                print(response["return_value"])
+                print("#########################</return_value>#########################")
+            if response.get("stderr", None) not in [None, ""]:
+                print("#########################<stderr>#########################")
+                print(response["stderr"])
+                print("#########################</stderr>#########################")
+            if response.get("error_traceback", None) not in [None, ""]:
+                print("#########################<traceback>#########################")
+                # Check if this is a security exception and highlight it in red if so
+                error_text = response["error_traceback"]
+                if "SECURITY" in error_text:
+                    print(f"{COLOR['RED']}{error_text}{COLOR['ENDC']}")
+                else:
+                    print(error_text)
+                print("#########################</traceback>#########################")
     
     def _quote_command_for_shell(self, command: List[str]) -> str:
         """
diff --git a/tinyagent/code_agent/providers/modal_provider.py b/tinyagent/code_agent/providers/modal_provider.py
@@ -163,13 +163,14 @@ def _setup_modal_app(self):
         if self.code_tools:
             self.add_tools(self.code_tools)
     
-    async def execute_python(self, code_lines: List[str], timeout: int = 120) -> Dict[str, Any]:
+    async def execute_python(self, code_lines: List[str], timeout: int = 120, debug_mode: bool = False) -> Dict[str, Any]:
         """
         Execute Python code using Modal's native .local() or .remote() methods.
         
         Args:
             code_lines: List of Python code lines to execute
             timeout: Maximum execution time in seconds
+            debug_mode: Whether to print the executed code (useful for debugging)
             
         Returns:
             Dictionary containing execution results
@@ -179,10 +180,11 @@ async def execute_python(self, code_lines: List[str], timeout: int = 120) -> Dic
         
         full_code = "\n".join(code_lines)
         
-        print("#" * 100)
-        print("##########################################code##########################################")
-        print(full_code)
-        print("#" * 100)
+        if debug_mode:
+            print("#" * 100)
+            print("##########################################code##########################################")
+            print(full_code)
+            print("#" * 100)
 
         
         # Use Modal's native execution methods
@@ -303,7 +305,8 @@ def _python_executor(self, code: str, globals_dict: Dict[str, Any] = None, local
         
         # Prepare the full code with default codes if needed
         if self.executed_default_codes:
-            print("✔️ default codes already executed")
+            if debug_mode:
+                print("✔️ default codes already executed")
             full_code = "\n".join(self.code_tools_definitions) +"\n\n"+code
             # Code tools and default code are trusted, user code is not
         else:
diff --git a/tinyagent/code_agent/providers/seatbelt_provider.py b/tinyagent/code_agent/providers/seatbelt_provider.py
@@ -375,13 +375,14 @@ def _write_seatbelt_profile_to_temp_file(self):
                 self.logger.error("Failed to write seatbelt profile to temporary file: %s", str(e))
             raise RuntimeError(f"Failed to write seatbelt profile: {str(e)}")
     
-    async def execute_python(self, code_lines: List[str], timeout: int = 120) -> Dict[str, Any]:
+    async def execute_python(self, code_lines: List[str], timeout: int = 120, debug_mode: bool = False) -> Dict[str, Any]:
         """
         Execute Python code within a sandbox and return the result.
         
         Args:
             code_lines: List of Python code lines to execute
             timeout: Maximum execution time in seconds
+            debug_mode: Whether to print the executed code and the execution response (useful for debugging)
             
         Returns:
             Dictionary containing execution results
@@ -391,14 +392,16 @@ async def execute_python(self, code_lines: List[str], timeout: int = 120) -> Dic
         
         full_code = "\n".join(code_lines)
         
-        print("#" * 100)
-        print("##########################################code##########################################")
-        print(full_code)
-        print("#" * 100)
+        if debug_mode:
+            print("#" * 100)
+            print("##########################################code##########################################")
+            print(full_code)
+            print("#" * 100)
         
         # Prepare the full code with tools and default codes if needed
         if self.executed_default_codes:
-            print("✔️ default codes already executed")
+            if debug_mode:
+                print("✔️ default codes already executed")
             complete_code = "\n".join(self.code_tools_definitions) + "\n\n" + full_code
         else:
             complete_code = "\n".join(self.code_tools_definitions) + "\n\n" + "\n".join(self.default_python_codes) + "\n\n" + full_code
@@ -701,7 +704,7 @@ def _sanitize_state_dict(d):
                     result["error"] = f"Process exited with code {process.returncode}"
                 
                 # Log the response
-                self._log_response(result)
+                self._log_response(result, debug_mode)
                 
                 return clean_response(result)
             
@@ -738,29 +741,30 @@ def _sanitize_state_dict(d):
             except Exception:
                 pass
     
-    def _log_response(self, response: Dict[str, Any]):
+    def _log_response(self, response: Dict[str, Any], debug_mode: bool = False):
         """Log the response from code execution."""
-        print("######################### SEATBELT EXECUTION #########################")
-        print("#########################<printed_output>#########################")
-        print(response["printed_output"])
-        print("#########################</printed_output>#########################")
-        if response.get("return_value", None) not in [None, ""]:
-            print("#########################<return_value>#########################")
-            print(response["return_value"])
-            print("#########################</return_value>#########################")
-        if response.get("stderr", None) not in [None, ""]:
-            print("#########################<stderr>#########################")
-            print(response["stderr"])
-            print("#########################</stderr>#########################")
-        if response.get("error_traceback", None) not in [None, ""]:
-            print("#########################<traceback>#########################")
-            # Check if this is a security exception and highlight it in red if so
-            error_text = response["error_traceback"]
-            if "SECURITY" in error_text:
-                print(f"{COLOR['RED']}{error_text}{COLOR['ENDC']}")
-            else:
-                print(error_text)
-            print("#########################</traceback>#########################")
+        if debug_mode:
+            print("######################### SEATBELT EXECUTION #########################")
+            print("#########################<printed_output>#########################")
+            print(response["printed_output"])
+            print("#########################</printed_output>#########################")
+            if response.get("return_value", None) not in [None, ""]:
+                print("#########################<return_value>#########################")
+                print(response["return_value"])
+                print("#########################</return_value>#########################")
+            if response.get("stderr", None) not in [None, ""]:
+                print("#########################<stderr>#########################")
+                print(response["stderr"])
+                print("#########################</stderr>#########################")
+            if response.get("error_traceback", None) not in [None, ""]:
+                print("#########################<traceback>#########################")
+                # Check if this is a security exception and highlight it in red if so
+                error_text = response["error_traceback"]
+                if "SECURITY" in error_text:
+                    print(f"{COLOR['RED']}{error_text}{COLOR['ENDC']}")
+                else:
+                    print(error_text)
+                print("#########################</traceback>#########################")
     
     
     def _quote_command_for_shell(self, command: List[str]) -> str:
@@ -915,7 +919,7 @@ async def _prepare_git_sandbox_command(self, command: List[str]) -> List[str]:
 # Check if it's a GitHub URL
 if [[ "$REMOTE_URL" == *"github.com"* ]]; then
     # Extract the repo path from the URL
-    REPO_PATH=$(echo "$REMOTE_URL" | sed -E 's|https://[^/]*github\.com/||' | sed -E 's|git@github\.com:||' | sed 's|\.git$||')
+    REPO_PATH=$(echo "$REMOTE_URL" | sed -E 's|https://[^/]*github\\.com/||' | sed -E 's|git@github\\.com:||' | sed 's|\\.git$||')
     
     # Set the remote URL with the token
     git remote set-url {remote_name} "https://{github_username}:{github_token}@github.com/$REPO_PATH.git"
diff --git a/tinyagent/code_agent/tiny_code_agent.py b/tinyagent/code_agent/tiny_code_agent.py