Skip to content

Commit c3869f4

Browse files
author
Codex
committed
chore: update shell command timeout to 3600 seconds across configuration files and documentation; add per-session message coalescing and in-flight task cancellation to the MessageBus
1 parent 7b9fecd commit c3869f4

File tree

11 files changed

+195
-15
lines changed

11 files changed

+195
-15
lines changed

.env.example

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -39,6 +39,9 @@ OPENROUTER_API_KEY=sk-or-your-openrouter-api-key-here
3939
# Custom base URL for providers (e.g., local LLM servers)
4040
# BASE_URL=https://your-custom-endpoint/v1
4141

42+
# Shell command timeout in seconds (default: 3600 = 60 minutes)
43+
# SPOON_BOT_SHELL_TIMEOUT=3600
44+
4245
# ======= Session Persistence (optional, default: file) =======
4346
#
4447
# Backend options: file (JSONL, default), sqlite, postgres

.gitignore

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -76,3 +76,7 @@ test_spoon.py
7676

7777
# Config file with credentials
7878
config.yaml
79+
80+
workspace/*
81+
sessions/*
82+
memory/*

Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -106,7 +106,7 @@ ENV JWT_ACCESS_EXPIRE_MINUTES=15
106106

107107
# --- Agent Settings ---
108108
ENV SPOON_BOT_MAX_ITERATIONS=20
109-
ENV SPOON_BOT_SHELL_TIMEOUT=60
109+
ENV SPOON_BOT_SHELL_TIMEOUT=3600
110110
ENV SPOON_BOT_MAX_OUTPUT=10000
111111
ENV SPOON_BOT_LOG_LEVEL=INFO
112112

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -503,7 +503,7 @@ The agent includes its context budget in the system prompt, allowing it to adjus
503503
│ SPOON-BOT TOOLS │
504504
├──────────────────────────────────────────────────────────────────┤
505505
│ Native OS Tools (Always Available, Priority) │
506-
│ ├── shell Execute commands (60s timeout, 10KB limit)
506+
│ ├── shell Execute commands (3600s timeout, 10KB limit) │
507507
│ ├── read_file Read file contents │
508508
│ ├── write_file Write content to file │
509509
│ ├── edit_file Edit file by replacing text │

config.example.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,7 @@ agent:
2424
# filesystem:
2525
# command: "npx"
2626
# args: ["-y", "@modelcontextprotocol/server-filesystem", "."]
27-
# shell_timeout: 60
27+
# shell_timeout: 3600
2828
# max_output: 10000
2929
# context_window: 200000
3030
# auto_reload: false # Watch skill paths & config for changes, auto-reload

spoon_bot/agent/loop.py

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -319,7 +319,7 @@ def __init__(
319319
api_key: str | None = None,
320320
base_url: str | None = None,
321321
max_iterations: int = 50,
322-
shell_timeout: int = 90,
322+
shell_timeout: int = 3600,
323323
max_output: int = 10000,
324324
session_key: str = "default",
325325
skill_paths: list[Path | str] | None = None,
@@ -672,8 +672,9 @@ async def initialize(self) -> None:
672672
# Initialize agent
673673
await self._agent.initialize()
674674

675-
# Increase default step timeout — on-chain txs (cast send) can take 60s+
676-
self._agent._default_timeout = 300.0
675+
# Keep the agent's per-step timeout aligned with the configured shell timeout
676+
# so long-running commands are not cancelled prematurely by the outer loop.
677+
self._agent._default_timeout = max(300.0, float(self.shell_timeout))
677678

678679
self._initialized = True
679680
active_count = len(self.tools.get_active_tools())

spoon_bot/agent/tools/self_config.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -204,7 +204,7 @@ def _get_defaults(self) -> dict[str, Any]:
204204
return {
205205
"model": "claude-sonnet-4.6",
206206
"max_iterations": 50,
207-
"shell_timeout": 60,
207+
"shell_timeout": 3600,
208208
"max_output": 10000,
209209
"provider": "anthropic",
210210
}

spoon_bot/agent/tools/shell.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -372,7 +372,7 @@ class ShellTool(Tool):
372372

373373
def __init__(
374374
self,
375-
timeout: int = 60,
375+
timeout: int = 3600,
376376
max_output: int = 10000,
377377
working_dir: str | None = None,
378378
whitelist_mode: bool = False,
@@ -389,7 +389,7 @@ def __init__(
389389
Initialize shell tool.
390390
391391
Args:
392-
timeout: Command timeout in seconds (default 60).
392+
timeout: Command timeout in seconds (default 3600).
393393
max_output: Maximum output characters (default 10000).
394394
working_dir: Default working directory.
395395
whitelist_mode: If True, only allow whitelisted commands.

spoon_bot/bus/events.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,9 @@ class InboundMessage:
2424
timestamp: datetime = field(default_factory=datetime.now)
2525
media: list[str] = field(default_factory=list)
2626
metadata: dict[str, Any] = field(default_factory=dict)
27+
# Sequence number assigned by MessageBus for latest-wins ordering.
28+
# 0 means not yet assigned.
29+
_bus_seq: int = field(default=0, repr=False)
2730

2831
@property
2932
def has_media(self) -> bool:

spoon_bot/bus/queue.py

Lines changed: 172 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,9 @@ class MessageBus:
2222
- Handler registration
2323
- Channel routing
2424
- Error handling
25+
- **Latest-wins with per-session coalescing**: when a new message arrives
26+
for a session that already has an in-flight or queued message, the
27+
in-flight task is cancelled and all pending messages for the session are
merged into one coalesced message, which is then processed.
2528
"""
2629

2730
def __init__(self, max_queue_size: int = 100, max_concurrency: int = 4):
@@ -41,6 +44,21 @@ def __init__(self, max_queue_size: int = 100, max_concurrency: int = 4):
4144
self._semaphore = asyncio.Semaphore(max_concurrency)
4245
self._active_tasks: set[asyncio.Task] = set()
4346

47+
# Message coalescing: when multiple messages arrive for the same
48+
# session before processing begins, they are merged into a single
49+
# message so the agent sees the full context (e.g. a follow-up
50+
# clarification is kept together with the original request).
51+
# If a task is already in-flight, it is cancelled and the new
52+
# (merged) message is processed instead.
53+
self._seq_counter: int = 0
54+
self._latest_seq: dict[str, int] = {}
55+
self._session_locks: dict[str, asyncio.Lock] = {}
56+
self._session_tasks: dict[str, asyncio.Task] = {}
57+
# Per-session accumulator: messages are buffered here on publish()
58+
# and drained at processing time so that all pending messages for a
59+
# session are coalesced into one.
60+
self._session_buffer: dict[str, list[InboundMessage]] = {}
61+
4462
def set_handler(self, handler: MessageHandler) -> None:
4563
"""
4664
Set the message handler (typically the agent).
@@ -74,12 +92,39 @@ async def publish(self, message: InboundMessage) -> bool:
7492
would freeze the channel's event handler (e.g. Discord gateway
7593
heartbeats), potentially causing a disconnect.
7694
95+
**Message coalescing**: the message is added to a per-session
96+
buffer *and* enqueued. When processing starts, all buffered
97+
messages for the session are merged into one so the agent sees
98+
the full context (follow-ups, corrections, etc.). If a task is
99+
already running for this session, it is cancelled and the new
100+
(coalesced) message takes over.
101+
77102
Args:
78103
message: Inbound message from a channel.
79104
80105
Returns:
81106
True if the message was enqueued, False if the queue is full.
82107
"""
108+
# Assign a sequence number for ordering
109+
self._seq_counter += 1
110+
message._bus_seq = self._seq_counter
111+
session_key = message.session_key or message.channel
112+
self._latest_seq[session_key] = self._seq_counter
113+
114+
# Accumulate in per-session buffer for coalescing at processing time
115+
self._session_buffer.setdefault(session_key, []).append(message)
116+
117+
# Cancel the currently running task for this session (if any).
118+
# The cancelled task will release its session lock, allowing the
119+
# new (coalesced) message to proceed once it is dequeued.
120+
existing_task = self._session_tasks.get(session_key)
121+
if existing_task and not existing_task.done():
122+
existing_task.cancel()
123+
logger.info(
124+
f"Cancelling in-flight task for session {session_key} — "
125+
f"newer message arrived: {message.content[:50]}..."
126+
)
127+
83128
try:
84129
self._queue.put_nowait(message)
85130
logger.debug(f"Published message from {message.channel}: {message.content[:50]}...")
@@ -110,6 +155,9 @@ async def _process_message(self, message: InboundMessage) -> None:
110155
else:
111156
logger.warning(f"No outbound handler for channel: {target_channel}")
112157

158+
except asyncio.CancelledError:
159+
# Let CancelledError propagate — the caller handles it.
160+
raise
113161
except Exception as e:
114162
logger.error(f"Error processing message: {e}")
115163
# Send error response to ensure channel cleanup (typing, reactions).
@@ -129,11 +177,132 @@ async def _process_message(self, message: InboundMessage) -> None:
129177
except Exception as send_err:
130178
logger.error(f"Failed to send error response: {send_err}")
131179

180+
def _get_session_lock(self, session_key: str) -> asyncio.Lock:
181+
"""Return (or create) a per-session lock for serialised processing."""
182+
lock = self._session_locks.get(session_key)
183+
if lock is None:
184+
lock = asyncio.Lock()
185+
self._session_locks[session_key] = lock
186+
return lock
187+
188+
@staticmethod
189+
def _coalesce_messages(messages: list[InboundMessage]) -> InboundMessage:
190+
"""Merge a list of messages into one, preserving the latest metadata.
191+
192+
The content of all messages is joined with newlines so the agent
193+
sees the full context. Media attachments are concatenated. All
194+
other fields (channel, session_key, metadata, …) are taken from
195+
the **last** message since it is the most recent user intent.
196+
"""
197+
if len(messages) == 1:
198+
return messages[0]
199+
200+
base = messages[-1] # newest message is the base
201+
merged_content = "\n".join(m.content for m in messages)
202+
203+
# Merge media from all messages (deduplicated, order preserved)
204+
seen: set[str] = set()
205+
merged_media: list[str] = []
206+
for m in messages:
207+
for path in m.media:
208+
if path not in seen:
209+
seen.add(path)
210+
merged_media.append(path)
211+
212+
# Build the coalesced message from the newest, replacing content/media
213+
coalesced = InboundMessage(
214+
content=merged_content,
215+
channel=base.channel,
216+
session_key=base.session_key,
217+
sender_id=base.sender_id,
218+
sender_name=base.sender_name,
219+
message_id=base.message_id,
220+
timestamp=base.timestamp,
221+
media=merged_media,
222+
metadata=base.metadata.copy() if base.metadata else {},
223+
)
224+
coalesced._bus_seq = base._bus_seq
225+
return coalesced
226+
132227
async def _process_with_semaphore(self, message: InboundMessage) -> None:
133-
"""Process a single message under the concurrency semaphore."""
228+
"""Process a single message under the concurrency semaphore.
229+
230+
**Per-session serialisation**: messages belonging to the same
231+
``session_key`` are processed one at a time via a per-session lock
232+
so that a fast second message cannot run concurrently with the
233+
first.
234+
235+
**Message coalescing**: before starting actual work, all pending
236+
messages for this session are drained from ``_session_buffer``
237+
and merged into one. This means follow-up messages ("also use
238+
TypeScript") are kept together with the original request.
239+
240+
If this trigger message is not the latest for its session (i.e.
241+
a newer trigger was already enqueued), it yields to the newer
242+
trigger which will perform the coalescing instead.
243+
244+
**Cancellation-safe**: if this task is cancelled (because a newer
245+
message triggered cancellation via ``publish()``), the session
246+
lock and semaphore are properly released and the queue bookkeeping
247+
is maintained.
248+
"""
249+
session_key = message.session_key or message.channel
250+
session_lock = self._get_session_lock(session_key)
251+
134252
try:
135-
async with self._semaphore:
136-
await self._process_message(message)
253+
# Acquire per-session lock first (no semaphore slot consumed
254+
# while waiting, so other sessions are not starved).
255+
async with session_lock:
256+
# Only the trigger with the highest seq should coalesce
257+
# and process. Earlier triggers for the same session
258+
# exit here — the latest trigger will pick up all
259+
# buffered messages.
260+
msg_seq = message._bus_seq
261+
latest = self._latest_seq.get(session_key, 0)
262+
if msg_seq < latest:
263+
logger.info(
264+
f"Skipping earlier trigger (seq={msg_seq}, "
265+
f"latest={latest}) for session {session_key}"
266+
)
267+
return
268+
269+
# Drain the per-session buffer and coalesce
270+
buffered = self._session_buffer.pop(session_key, [])
271+
if buffered:
272+
message = self._coalesce_messages(buffered)
273+
if len(buffered) > 1:
274+
logger.info(
275+
f"Coalesced {len(buffered)} messages for "
276+
f"session {session_key}"
277+
)
278+
279+
# Register as the active task for this session
280+
current_task = asyncio.current_task()
281+
self._session_tasks[session_key] = current_task # type: ignore[assignment]
282+
283+
try:
284+
async with self._semaphore:
285+
await self._process_message(message)
286+
except asyncio.CancelledError:
287+
logger.info(
288+
f"Task cancelled for session {session_key}: "
289+
f"{message.content[:50]}..."
290+
)
291+
# Do NOT re-raise inside the session_lock context —
292+
# we want to release the lock cleanly so the next
293+
# message can proceed.
294+
return
295+
finally:
296+
# Only clear if we are still the registered task
297+
if self._session_tasks.get(session_key) is current_task:
298+
self._session_tasks.pop(session_key, None)
299+
except asyncio.CancelledError:
300+
# Cancelled while waiting for the session lock — nothing to
301+
# clean up, just exit silently.
302+
logger.debug(
303+
f"Task cancelled while waiting for lock, "
304+
f"session {session_key}: {message.content[:50]}..."
305+
)
137306
finally:
138307
self._queue.task_done()
139308

0 commit comments

Comments
 (0)