autogpt_platform/backend/backend/api/features/chat/tools/binary_output_processor.py
@@ -0,0 +1,123 @@
"""Save binary block outputs to workspace, return references instead of base64."""

import base64
import binascii
import hashlib
import logging
import uuid
from typing import Any

from backend.util.workspace import WorkspaceManager

logger = logging.getLogger(__name__)

BINARY_FIELDS = {"png", "jpeg", "pdf"} # Base64 encoded
TEXT_FIELDS = {"svg"} # Large text, save raw
SAVEABLE_FIELDS = BINARY_FIELDS | TEXT_FIELDS
SIZE_THRESHOLD = 1024 # Only process content > 1KB (string length, not decoded size)


async def process_binary_outputs(
outputs: dict[str, list[Any]],
workspace_manager: WorkspaceManager,
block_name: str,
) -> dict[str, list[Any]]:
"""
Replace binary data in block outputs with workspace:// references.

Deduplicates identical content within a single call (e.g., same PDF
appearing in both main_result and results).
"""
cache: dict[str, str] = {} # content_hash -> workspace_ref

processed: dict[str, list[Any]] = {}
for name, items in outputs.items():
processed_items: list[Any] = []
for item in items:
processed_items.append(
await _process_item(item, workspace_manager, block_name, cache)
)
processed[name] = processed_items
return processed


async def _process_item(
item: Any, wm: WorkspaceManager, block: str, cache: dict
) -> Any:
"""Recursively process an item, handling dicts and lists."""
if isinstance(item, dict):
return await _process_dict(item, wm, block, cache)
if isinstance(item, list):
processed: list[Any] = []
for i in item:
processed.append(await _process_item(i, wm, block, cache))
return processed
return item


async def _process_dict(
data: dict, wm: WorkspaceManager, block: str, cache: dict
) -> dict:
"""Process a dict, saving binary fields and recursing into nested structures."""
result: dict[str, Any] = {}

for key, value in data.items():
if (
key in SAVEABLE_FIELDS
and isinstance(value, str)
and len(value) > SIZE_THRESHOLD
):
content_hash = hashlib.sha256(value.encode()).hexdigest()
Bug: Deduplication fails because it hashes the raw base64 string before decoding, causing identical binary content with different string formats (e.g., with/without a data URI prefix) to be saved as separate files.
Severity: MEDIUM

Suggested Fix

The base64 string value should be decoded into its binary form before the hash is computed. This ensures that the hash represents the actual content, not its string representation, allowing for correct deduplication across different base64 formats.
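
A minimal sketch of that change, reusing the padding and data-URI handling already in `_decode_base64` (a hypothetical helper written for illustration, not the PR's code):

import base64
import hashlib


def _content_hash(value: str) -> str:
    """Hash decoded bytes so raw base64 and data-URI forms dedupe together."""
    if value.startswith("data:") and "," in value:
        value = value.split(",", 1)[1]  # strip "data:image/png;base64," prefix
    try:
        # Same padding normalization the module uses before strict decoding
        decoded = base64.b64decode(value + "=" * (-len(value) % 4), validate=True)
    except Exception:
        decoded = value.encode()  # non-base64 fields (e.g. svg): hash raw text
    return hashlib.sha256(decoded).hexdigest()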

Prompt for AI Agent
Review the code at the location below. A potential bug has been identified by an AI agent. Verify if this is a real issue. If it is, propose a fix; if not, explain why it's not valid.

Location:
autogpt_platform/backend/backend/api/features/chat/tools/binary_output_processor.py#L70

Potential issue: The deduplication logic in `binary_output_processor.py` computes a SHA256 hash on the raw base64 string representation of binary data at line 70. However, the same binary content can be represented by different strings, such as raw base64 (`"ABC..."`) or a data URI (`"data:image/png;base64,ABC..."`). Because the hashing occurs before the string is decoded, these different representations produce different hashes for the same underlying data. This causes the deduplication to fail, leading to redundant storage of identical binary files in the workspace and defeating the feature's purpose of reducing storage and token overhead.



if content_hash in cache:
result[key] = cache[content_hash]
elif ref := await _save(value, key, wm, block):
cache[content_hash] = ref
result[key] = ref
else:
result[key] = value # Save failed, keep original

elif isinstance(value, dict):
result[key] = await _process_dict(value, wm, block, cache)
elif isinstance(value, list):
processed: list[Any] = []
for i in value:
processed.append(await _process_item(i, wm, block, cache))
result[key] = processed
else:
result[key] = value

return result


async def _save(value: str, field: str, wm: WorkspaceManager, block: str) -> str | None:
"""Save content to workspace, return workspace:// reference or None on failure."""
try:
if field in BINARY_FIELDS:
content = _decode_base64(value)
if content is None:
return None
else:
content = value.encode("utf-8")

ext = {"jpeg": "jpg"}.get(field, field)
filename = f"{block.lower().replace(' ', '_')[:20]}_{field}_{uuid.uuid4().hex[:12]}.{ext}"

file = await wm.write_file(content=content, filename=filename)
return f"workspace://{file.id}"
Comment on lines +103 to +107
Contributor
@coderabbitai coderabbitai bot Feb 4, 2026
⚠️ Potential issue | 🟠 Major

🧩 Analysis chain

🏁 Scripts executed (verification commands; outputs collapsed):

find autogpt_platform/backend -name "workspace.py" -type f
rg -n "def write_file" autogpt_platform/backend --type py -A 10 | head -50
cat autogpt_platform/backend/backend/util/workspace.py | head -200
sed -n '155,250p' autogpt_platform/backend/backend/util/workspace.py
sed -n '215,240p' autogpt_platform/backend/backend/util/workspace.py
find autogpt_platform/backend -name "workspace_storage.py" -type f
rg -n "def store\|class.*Storage" autogpt_platform/backend/backend/util/workspace_storage.py -A 5 | head -80
cat autogpt_platform/backend/backend/util/workspace_storage.py | head -300
rg -n "def sanitize_filename" autogpt_platform/backend --type py -A 15
cat autogpt_platform/backend/backend/api/features/chat/tools/binary_output_processor.py | head -120


Sanitize block parameter before using in filename.

The block parameter is only cleaned with .lower().replace(' ', '_'), which leaves path separators (/, \) and other unsafe characters. While LocalWorkspaceStorage mitigates this via sanitize_filename(), GCSWorkspaceStorage passes the filename directly to blob paths without sanitization, allowing malformed blob paths in cloud deployments.

Sanitize block before constructing the filename:

Suggested fix
+from backend.util.file import sanitize_filename
+
         ext = {"jpeg": "jpg"}.get(field, field)
-        filename = f"{block.lower().replace(' ', '_')[:20]}_{field}_{uuid.uuid4().hex[:12]}.{ext}"
+        safe_block = sanitize_filename(block.lower())[:20]
+        filename = f"{safe_block}_{field}_{uuid.uuid4().hex[:12]}.{ext}"
🤖 Prompt for AI Agents
In `autogpt_platform/backend/backend/api/features/chat/tools/binary_output_processor.py` around lines 103-107: the filename construction uses the raw block value and only lower()/replace(' ', '_'), which lets path separators and other unsafe characters reach the storage backends. Sanitize block first (strip or replace path separators, drop other non-alphanumeric characters, allow only [a-z0-9_-], and truncate to the desired length) before building filename = f"{...}_{field}_{uuid...}.{ext}", and pass the sanitized value through to wm.write_file so both LocalWorkspaceStorage and GCSWorkspaceStorage receive a safe filename. Reuse the existing sanitize_filename helper if available, or add a small sanitizer next to the filename construction.
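
If the `sanitize_filename` helper can't be imported here, a minimal allowlist sanitizer in the spirit of that prompt might look like this (hypothetical function, for illustration only):

import re


def _safe_block_name(block: str, max_len: int = 20) -> str:
    """Collapse anything outside [a-z0-9_-] (incl. path separators) to "_"."""
    cleaned = re.sub(r"[^a-z0-9_-]+", "_", block.lower())
    return cleaned.strip("_")[:max_len] or "block"

The filename in `_save` would then be built as f"{_safe_block_name(block)}_{field}_{uuid.uuid4().hex[:12]}.{ext}".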

Member

this is true, 80% confidence

Contributor
@ntindle Thank you for confirming! Since the block parameter comes from user-controlled input (block names), sanitizing it before filename construction will help ensure safe filenames across both local and cloud storage backends.

The suggested fix using sanitize_filename from backend.util.file should handle path separators, special characters, and other unsafe inputs. Let me know if you'd like me to help with anything else related to this change! 👍


🧠 Learnings used
Learnt from: CR
Repo: Significant-Gravitas/AutoGPT PR: 0
File: autogpt_platform/backend/CLAUDE.md:0-0
Timestamp: 2026-02-04T16:50:20.494Z
Learning: Applies to autogpt_platform/backend/backend/blocks/*.py : Never hardcode workspace checks when using `store_media_file()` - let `for_block_output` handle context adaptation automatically

Learnt from: CR
Repo: Significant-Gravitas/AutoGPT PR: 0
File: autogpt_platform/backend/CLAUDE.md:0-0
Timestamp: 2026-02-04T16:50:20.494Z
Learning: Applies to autogpt_platform/backend/backend/blocks/*.py : Always use `for_block_output` format in `store_media_file()` for block outputs unless there is a specific reason not to

Learnt from: CR
Repo: Significant-Gravitas/AutoGPT PR: 0
File: autogpt_platform/backend/CLAUDE.md:0-0
Timestamp: 2026-02-04T16:50:20.494Z
Learning: Applies to autogpt_platform/backend/backend/blocks/*.py : When working with files in blocks, use `store_media_file()` from `backend.util.file` with appropriate `return_format` parameter: `for_local_processing` for local tools, `for_external_api` for external APIs, `for_block_output` for block outputs

Learnt from: CR
Repo: Significant-Gravitas/AutoGPT PR: 0
File: .github/copilot-instructions.md:0-0
Timestamp: 2026-02-04T16:49:42.476Z
Learning: Applies to autogpt_platform/backend/backend/blocks/**/*.py : Generate block UUID using 'uuid.uuid4()' when creating new blocks in backend


except Exception as e:
logger.error(f"Failed to save {field} to workspace for block '{block}': {e}")
return None


def _decode_base64(value: str) -> bytes | None:
"""Decode base64, handling data URI format. Returns None on failure."""
try:
if value.startswith("data:"):
value = value.split(",", 1)[1] if "," in value else value
# Normalize padding and use strict validation to prevent corrupted data
padded = value + "=" * (-len(value) % 4)
return base64.b64decode(padded, validate=True)
except (binascii.Error, ValueError):
return None
@@ -8,12 +8,16 @@
from pydantic_core import PydanticUndefined

from backend.api.features.chat.model import ChatSession
from backend.api.features.chat.tools.binary_output_processor import (
process_binary_outputs,
)
from backend.data.block import get_block
from backend.data.execution import ExecutionContext
from backend.data.model import CredentialsMetaInput
from backend.data.workspace import get_or_create_workspace
from backend.integrations.creds_manager import IntegrationCredentialsManager
from backend.util.exceptions import BlockError
from backend.util.workspace import WorkspaceManager

from .base import BaseTool
from .models import (
@@ -321,11 +325,19 @@ async def _execute(
):
outputs[output_name].append(output_data)

# Save binary outputs to workspace to prevent context bloat
workspace_manager = WorkspaceManager(
user_id, workspace.id, session.session_id
)
processed_outputs = await process_binary_outputs(
dict(outputs), workspace_manager, block.name
)

return BlockOutputResponse(
message=f"Block '{block.name}' executed successfully",
block_id=block_id,
block_name=block.name,
outputs=dict(outputs),
outputs=processed_outputs,
success=True,
session_id=session_id,
)
@@ -0,0 +1,92 @@
import base64
from unittest.mock import AsyncMock, MagicMock

import pytest

from backend.api.features.chat.tools.binary_output_processor import (
_decode_base64,
process_binary_outputs,
)


@pytest.fixture
def workspace_manager():
wm = AsyncMock()
wm.write_file = AsyncMock(return_value=MagicMock(id="file-123"))
return wm


class TestDecodeBase64:
def test_raw_base64(self):
assert _decode_base64(base64.b64encode(b"test").decode()) == b"test"

def test_data_uri(self):
encoded = base64.b64encode(b"test").decode()
assert _decode_base64(f"data:image/png;base64,{encoded}") == b"test"

def test_invalid_returns_none(self):
assert _decode_base64("not base64!!!") is None


class TestProcessBinaryOutputs:
@pytest.mark.asyncio
async def test_saves_large_binary(self, workspace_manager):
content = base64.b64encode(b"x" * 2000).decode()
outputs = {"result": [{"png": content, "text": "ok"}]}

result = await process_binary_outputs(outputs, workspace_manager, "Test")

assert result["result"][0]["png"] == "workspace://file-123"
assert result["result"][0]["text"] == "ok"

@pytest.mark.asyncio
async def test_skips_small_content(self, workspace_manager):
content = base64.b64encode(b"tiny").decode()
outputs = {"result": [{"png": content}]}

result = await process_binary_outputs(outputs, workspace_manager, "Test")

assert result["result"][0]["png"] == content
workspace_manager.write_file.assert_not_called()

@pytest.mark.asyncio
async def test_deduplicates_identical_content(self, workspace_manager):
content = base64.b64encode(b"x" * 2000).decode()
outputs = {"a": [{"pdf": content}], "b": [{"pdf": content}]}

result = await process_binary_outputs(outputs, workspace_manager, "Test")

assert result["a"][0]["pdf"] == result["b"][0]["pdf"] == "workspace://file-123"
assert workspace_manager.write_file.call_count == 1

@pytest.mark.asyncio
async def test_failure_preserves_original(self, workspace_manager):
workspace_manager.write_file.side_effect = Exception("Storage error")
content = base64.b64encode(b"x" * 2000).decode()

result = await process_binary_outputs(
{"r": [{"png": content}]}, workspace_manager, "Test"
)

assert result["r"][0]["png"] == content

@pytest.mark.asyncio
async def test_handles_nested_structures(self, workspace_manager):
content = base64.b64encode(b"x" * 2000).decode()
outputs = {"result": [{"outer": {"inner": {"png": content}}}]}

result = await process_binary_outputs(outputs, workspace_manager, "Test")

assert result["result"][0]["outer"]["inner"]["png"] == "workspace://file-123"

@pytest.mark.asyncio
async def test_handles_lists_in_output(self, workspace_manager):
content = base64.b64encode(b"x" * 2000).decode()
outputs = {"result": [{"images": [{"png": content}, {"png": content}]}]}

result = await process_binary_outputs(outputs, workspace_manager, "Test")

assert result["result"][0]["images"][0]["png"] == "workspace://file-123"
assert result["result"][0]["images"][1]["png"] == "workspace://file-123"
# Deduplication should still work
assert workspace_manager.write_file.call_count == 1