From be201ee8a806399f8879effb2c2a3dfa67ce0846 Mon Sep 17 00:00:00 2001
From: Gustav von Zitzewitz <gustav@openai.com>
Date: Mon, 12 Jan 2026 14:23:59 +0100
Subject: [PATCH 1/2] Enforce shell output length limits

---
 src/agents/_run_impl.py  | 49 +++++++++++++++++++++++++++++++++++++++-
 tests/test_shell_tool.py | 46 +++++++++++++++++++++++++++++++++++++
 2 files changed, 94 insertions(+), 1 deletion(-)

diff --git a/src/agents/_run_impl.py b/src/agents/_run_impl.py
index 2797113283..efc12a30b6 100644
--- a/src/agents/_run_impl.py
+++ b/src/agents/_run_impl.py
@@ -1739,6 +1739,7 @@ async def execute(
         shell_output_payload: list[dict[str, Any]] | None = None
         provider_meta: dict[str, Any] | None = None
         max_output_length: int | None = None
+        requested_max_output_length = shell_call.action.max_output_length
 
         try:
             executor_result = call.shell_tool.executor(request)
@@ -1748,12 +1749,19 @@ async def execute(
 
             if isinstance(result, ShellResult):
                 normalized = [_normalize_shell_output(entry) for entry in result.output]
+                max_output_length = result.max_output_length or requested_max_output_length
+                if max_output_length is not None:
+                    normalized = _truncate_shell_outputs(normalized, max_output_length)
                 output_text = _render_shell_outputs(normalized)
+                if max_output_length is not None:
+                    output_text = output_text[:max_output_length]
                 shell_output_payload = [_serialize_shell_output(entry) for entry in normalized]
                 provider_meta = dict(result.provider_data or {})
-                max_output_length = result.max_output_length
             else:
                 output_text = str(result)
+                if requested_max_output_length is not None:
+                    max_output_length = requested_max_output_length
+                    output_text = output_text[:max_output_length]
         except Exception as exc:
             status = "failed"
             output_text = _format_shell_error(exc)
@@ -2029,6 +2037,45 @@ def _render_shell_outputs(outputs: Sequence[ShellCommandOutput]) -> str:
     return "\n\n".join(rendered_chunks)
 
 
+def _truncate_shell_outputs(
+    outputs: Sequence[ShellCommandOutput], max_length: int
+) -> list[ShellCommandOutput]:
+    if max_length <= 0:
+        return [
+            ShellCommandOutput(
+                stdout="",
+                stderr="",
+                outcome=output.outcome,
+                command=output.command,
+                provider_data=output.provider_data,
+            )
+            for output in outputs
+        ]
+
+    remaining = max_length
+    truncated: list[ShellCommandOutput] = []
+    for output in outputs:
+        stdout = ""
+        stderr = ""
+        if remaining > 0 and output.stdout:
+            stdout = output.stdout[:remaining]
+            remaining -= len(stdout)
+        if remaining > 0 and output.stderr:
+            stderr = output.stderr[:remaining]
+            remaining -= len(stderr)
+        truncated.append(
+            ShellCommandOutput(
+                stdout=stdout,
+                stderr=stderr,
+                outcome=output.outcome,
+                command=output.command,
+                provider_data=output.provider_data,
+            )
+        )
+
+    return truncated
+
+
 def _format_shell_error(error: Exception | BaseException | Any) -> str:
     if isinstance(error, Exception):
         message = str(error)
diff --git a/tests/test_shell_tool.py b/tests/test_shell_tool.py
index d2132d6a2d..36a95e6ef3 100644
--- a/tests/test_shell_tool.py
+++ b/tests/test_shell_tool.py
@@ -135,3 +135,49 @@ def __call__(self, request):
     assert "status" not in payload_dict
     assert "shell_output" not in payload_dict
     assert "provider_data" not in payload_dict
+
+
+@pytest.mark.asyncio
+async def test_shell_tool_output_respects_max_output_length() -> None:
+    shell_tool = ShellTool(
+        executor=lambda request: ShellResult(
+            output=[
+                ShellCommandOutput(
+                    stdout="0123456789",
+                    stderr="abcdef",
+                    outcome=ShellCallOutcome(type="exit", exit_code=0),
+                )
+            ],
+        )
+    )
+
+    tool_call = {
+        "type": "shell_call",
+        "id": "shell_call",
+        "call_id": "call_shell",
+        "status": "completed",
+        "action": {
+            "commands": ["echo hi"],
+            "timeout_ms": 1000,
+            "max_output_length": 6,
+        },
+    }
+
+    tool_run = ToolRunShellCall(tool_call=tool_call, shell_tool=shell_tool)
+    agent = Agent(name="shell-agent", tools=[shell_tool])
+    context_wrapper: RunContextWrapper[Any] = RunContextWrapper(context=None)
+
+    result = await ShellAction.execute(
+        agent=agent,
+        call=tool_run,
+        hooks=RunHooks[Any](),
+        context_wrapper=context_wrapper,
+        config=RunConfig(),
+    )
+
+    assert isinstance(result, ToolCallOutputItem)
+    assert result.output == "012345"
+    raw_item = cast(dict[str, Any], result.raw_item)
+    assert raw_item["max_output_length"] == 6
+    assert raw_item["output"][0]["stdout"] == "012345"
+    assert raw_item["output"][0]["stderr"] == ""

From 32adfc2bc9bfd7a0652b11825457cfa30d3277e4 Mon Sep 17 00:00:00 2001
From: Gustav von Zitzewitz <gustav@openai.com>
Date: Tue, 13 Jan 2026 19:11:51 +0100
Subject: [PATCH 2/2] fix max_output_length=0 case

---
 src/agents/_run_impl.py  |  6 ++++-
 tests/test_shell_tool.py | 47 ++++++++++++++++++++++++++++++++++++++++
 2 files changed, 52 insertions(+), 1 deletion(-)

diff --git a/src/agents/_run_impl.py b/src/agents/_run_impl.py
index efc12a30b6..95bd87fc69 100644
--- a/src/agents/_run_impl.py
+++ b/src/agents/_run_impl.py
@@ -1749,7 +1749,11 @@ async def execute(
 
             if isinstance(result, ShellResult):
                 normalized = [_normalize_shell_output(entry) for entry in result.output]
-                max_output_length = result.max_output_length or requested_max_output_length
+                max_output_length = (
+                    result.max_output_length
+                    if result.max_output_length is not None
+                    else requested_max_output_length
+                )
                 if max_output_length is not None:
                     normalized = _truncate_shell_outputs(normalized, max_output_length)
                 output_text = _render_shell_outputs(normalized)
diff --git a/tests/test_shell_tool.py b/tests/test_shell_tool.py
index 36a95e6ef3..af2dfc9d77 100644
--- a/tests/test_shell_tool.py
+++ b/tests/test_shell_tool.py
@@ -181,3 +181,50 @@ async def test_shell_tool_output_respects_max_output_length() -> None:
     assert raw_item["max_output_length"] == 6
     assert raw_item["output"][0]["stdout"] == "012345"
     assert raw_item["output"][0]["stderr"] == ""
+
+
+@pytest.mark.asyncio
+async def test_shell_tool_executor_can_override_max_output_length_to_zero() -> None:
+    shell_tool = ShellTool(
+        executor=lambda request: ShellResult(
+            output=[
+                ShellCommandOutput(
+                    stdout="0123456789",
+                    stderr="abcdef",
+                    outcome=ShellCallOutcome(type="exit", exit_code=0),
+                )
+            ],
+            max_output_length=0,
+        )
+    )
+
+    tool_call = {
+        "type": "shell_call",
+        "id": "shell_call",
+        "call_id": "call_shell",
+        "status": "completed",
+        "action": {
+            "commands": ["echo hi"],
+            "timeout_ms": 1000,
+            "max_output_length": 6,
+        },
+    }
+
+    tool_run = ToolRunShellCall(tool_call=tool_call, shell_tool=shell_tool)
+    agent = Agent(name="shell-agent", tools=[shell_tool])
+    context_wrapper: RunContextWrapper[Any] = RunContextWrapper(context=None)
+
+    result = await ShellAction.execute(
+        agent=agent,
+        call=tool_run,
+        hooks=RunHooks[Any](),
+        context_wrapper=context_wrapper,
+        config=RunConfig(),
+    )
+
+    assert isinstance(result, ToolCallOutputItem)
+    assert result.output == ""
+    raw_item = cast(dict[str, Any], result.raw_item)
+    assert raw_item["max_output_length"] == 0
+    assert raw_item["output"][0]["stdout"] == ""
+    assert raw_item["output"][0]["stderr"] == ""