Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
238 changes: 238 additions & 0 deletions docs/examples/tools/shell_example.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,238 @@
# pytest: e2e, qualitative
"""Example usage patterns for bash_executor and unsafe_local_bash_executor tools.

Demonstrates multiple ways to use Mellea's bash execution capabilities:
1. Direct execution for non-LLM tasks
2. Wrapping as a MelleaTool for agent use
3. LLM-based tool calling with forced tool use
4. Integration with error handling

⚠️ Security note: bash_executor uses Docker isolation via llm-sandbox (recommended
for production and LLM-generated code). unsafe_local_bash_executor runs commands
directly with no isolation (development/testing only with trusted code).
Both enforce a conservative safety denylist: no sudo, no rm -rf, no destructive
git operations, no writes to /etc, /sys, /proc, etc. Write operations can also
be constrained with ``working_dir`` and explicit ``allowed_paths``.

Note: Commands must use argv-friendly syntax (no pipes, redirects, or shell builtins).
Use individual commands and compose them in Python instead.
"""

from mellea import MelleaSession, start_session
from mellea.backends import ModelOption
from mellea.backends.tools import MelleaTool
from mellea.stdlib.requirements import uses_tool
from mellea.stdlib.tools.shell import bash_executor, unsafe_local_bash_executor


def example_1_direct_execution() -> None:
    """Example 1: Execute bash commands directly."""
    print("=== Example 1: Direct Execution ===")

    # Run a basic echo command and report its outcome.
    echo_result = unsafe_local_bash_executor("echo 'Hello from Bash'")
    print("Command: echo 'Hello from Bash'")
    print(f"Success: {echo_result.success}")
    print(f"Output: {echo_result.stdout}")
    print()

    # List directory contents; show only a short prefix of the output.
    listing = unsafe_local_bash_executor("ls -la")
    print("Command: ls -la")
    print(f"Success: {listing.success}")
    if listing.stdout:
        head = listing.stdout.split("\n")[:3]
        print("Output (first 3 lines):\n" + "\n".join(head))
    print()

    # Pipe operators are not argv-friendly and are rejected by the safety layer.
    piped = unsafe_local_bash_executor("ls -la | wc -l")
    print("Command: ls -la | wc -l (pipe operator blocked)")
    print(f"Rejected: {piped.skipped}")
    print(f"Reason: {piped.skip_message}")
    print()

    # Privilege escalation is on the denylist and never executes.
    escalated = unsafe_local_bash_executor("sudo echo unsafe")
    print("Command: sudo echo unsafe")
    print(f"Skipped: {escalated.skipped}")
    print(f"Reason: {escalated.skip_message}")
    print()


def example_2_wrapped_as_tool() -> None:
    """Example 2: Wrap bash executor as a MelleaTool for LLM use."""
    print("=== Example 2: Wrapped as MelleaTool ===")

    # Build a MelleaTool wrapper around the raw executor callable.
    wrapped = MelleaTool.from_callable(unsafe_local_bash_executor)
    print(f"Tool name: {wrapped.name}")
    print(f"Tool schema keys: {wrapped.as_json_tool.keys()}")
    print()

    # Call the tool by hand — in real use an LLM would issue this call.
    outcome = wrapped.run("pwd")
    print("Tool invocation result:")
    print(f" Success: {outcome.success}")
    print(f" Output: {outcome.stdout}")
    print()


def example_3_llm_with_forced_tool_use(m: MelleaSession) -> None:
    """Example 3: LLM generates bash commands with forced tool use (requires Ollama).

    This mirrors the Python interpreter pattern: ask the LLM to generate
    a bash command, force it to use the tool, then execute the command.

    Requirements:
    - Ollama running locally (or compatible LLM configured)
    - Run: ollama serve
    """
    print("=== Example 3: LLM-Generated Bash Commands with Forced Tool Use ===")

    response = m.instruct(
        description="Use bash to count how many Python files are in the current directory.",
        requirements=[uses_tool(unsafe_local_bash_executor)],
        model_options={
            ModelOption.TOOLS: [MelleaTool.from_callable(unsafe_local_bash_executor)]
        },
        tool_calls=True,
    )

    # Guard clauses: fail loudly when the model did not call the tool as asked.
    if response.tool_calls is None:
        raise ValueError("Expected tool_calls but got None")

    if "unsafe_local_bash_executor" not in response.tool_calls:
        raise ValueError(
            f"Expected tool 'unsafe_local_bash_executor' in tool_calls, "
            f"but got: {list(response.tool_calls.keys())}"
        )

    # Pull out the tool call and make sure it carries the expected argument.
    chosen_call = response.tool_calls["unsafe_local_bash_executor"]
    if "command" not in chosen_call.args:
        raise ValueError(
            f"Expected 'command' argument in tool call args, "
            f"but got: {list(chosen_call.args.keys())}"
        )

    generated = chosen_call.args["command"]
    print(f"LLM generated bash command:\n {generated}\n")

    # Execute the command through the tool-call object itself.
    run_result = chosen_call.call_func()

    print("Execution result:")
    print(f" Success: {run_result.success}")
    print(f" Skipped: {run_result.skipped}")
    if run_result.skip_message:
        print(f" Skip reason: {run_result.skip_message}")
    print(f" Output: {run_result.stdout}")
    if run_result.stderr:
        print(f" Error: {run_result.stderr}")
    print()


def example_3_with_working_dir() -> None:
    """Example 3: Restrict write validation and execution cwd to a directory."""
    print("=== Example 3: Working Directory Restriction ===")

    import os
    import tempfile

    with tempfile.TemporaryDirectory() as sandbox:
        print(f"Working directory: {sandbox}")

        # Relative writes resolve inside the sandbox; `touch` is used because
        # shell redirects are blocked by the executor.
        created = unsafe_local_bash_executor("touch myfile.txt", working_dir=sandbox)
        print(f"Command: touch myfile.txt (relative path, executed in {sandbox})")
        print(f"Success: {created.success}")
        print()

        # Confirm on the Python side that the file really exists.
        target = os.path.join(sandbox, "myfile.txt")
        if os.path.exists(target):
            print(f"✓ File created at: {target}")
        print()

        # Reading the file back works the same way.
        read_back = unsafe_local_bash_executor("cat myfile.txt", working_dir=sandbox)
        print("Command: cat myfile.txt")
        print(f"Output: {read_back.stdout}")
        print()

        # /tmp is exempt from the working-dir restriction.
        tmp_write = unsafe_local_bash_executor(
            "touch /tmp/tmpfile.txt", working_dir=sandbox
        )
        print(f"Command: touch /tmp/tmpfile.txt (with working_dir={sandbox})")
        print(f"Success: {tmp_write.success} (note: /tmp is always allowed)")
        print()

        # System paths stay off-limits regardless of working_dir.
        denied = unsafe_local_bash_executor("touch /etc/config.txt", working_dir=sandbox)
        print(f"Command: touch /etc/config.txt (with working_dir={sandbox})")
        print(f"Rejected: {denied.skipped}")
        print(f"Reason: {denied.skip_message}")
        print()


def example_4_safety_features() -> None:
    """Example 4: Demonstrate safety features."""
    print("=== Example 4: Safety Features ===")

    # Each entry pairs a denylisted command with a human-readable label.
    blocked_attempts = (
        ("rm -rf /home", "Recursive force delete"),
        ("git push --force", "Force git push"),
        ("sudo whoami", "Privilege escalation"),
        ("bash -i", "Interactive shell"),
        ("touch /etc/config", "Write to system path"),
    )

    # Every command below should be rejected before execution.
    for attempt, label in blocked_attempts:
        outcome = unsafe_local_bash_executor(attempt)
        print(f"{label}: {attempt}")
        print(f" Rejected: {outcome.skipped}")
        print(f" Reason: {outcome.skip_message}")
        print()


def example_5_error_handling() -> None:
    """Example 5: Handle execution errors gracefully."""
    print("=== Example 5: Error Handling ===")

    # `false` exits with status 1, so the result reports failure.
    failing = unsafe_local_bash_executor("false")
    print("Command: false (POSIX command that returns exit code 1)")
    print(f"Success: {failing.success}")
    print(f"Return code indicates failure: {not failing.success}")
    print()

    # An unknown binary also fails; surface a snippet of stderr if present.
    missing = unsafe_local_bash_executor("nonexistent_command_xyz")
    print("Command: nonexistent_command_xyz")
    print(f"Success: {missing.success}")
    if not missing.success and missing.stderr is not None:
        print(f"Error output: {missing.stderr[:100]}")
    print()


if __name__ == "__main__":
    # Examples 1 and 2 run purely locally: direct execution and tool wrapping.
    example_1_direct_execution()
    example_2_wrapped_as_tool()

    # Example 3: Run with LLM-based tool calling (requires Ollama or compatible LLM)
    # Uncomment these lines to test LLM-generated commands:
    # try:
    #     m = start_session()
    #     example_3_llm_with_forced_tool_use(m)
    # except Exception as e:
    #     print(f"Example 3 skipped: {e!s}")
    #     print(" Requires: Ollama running locally or compatible LLM configured")
    #     print(" See: https://docs.ollama.ai/")

    # Remaining examples also run without an LLM backend.
    example_3_with_working_dir()
    example_4_safety_features()
    example_5_error_handling()
17 changes: 16 additions & 1 deletion mellea/stdlib/tools/__init__.py
Original file line number Diff line number Diff line change
@@ -1,5 +1,20 @@
"""Implementations of tools."""

from .interpreter import code_interpreter, local_code_interpreter
from .shell import (
BashEnvironment,
LLMSandboxBashEnvironment,
StaticBashEnvironment,
bash_executor,
unsafe_local_bash_executor,
)

__all__ = ["code_interpreter", "local_code_interpreter"]
__all__ = [
"BashEnvironment",
"LLMSandboxBashEnvironment",
"StaticBashEnvironment",
"bash_executor",
"code_interpreter",
"local_code_interpreter",
"unsafe_local_bash_executor",
]
Loading