lukeocodes
diff --git a/‎.github/workflows/release-please.yml‎
Lines changed: 18 additions & 19 deletions b/‎.github/workflows/release-please.yml‎
Lines changed: 18 additions & 19 deletions
diff --git a/‎docs/Message Splitting.md‎
Lines changed: 142 additions & 0 deletions b/‎docs/Message Splitting.md‎
Lines changed: 142 additions & 0 deletions
diff --git a/‎pyproject.toml‎
Lines changed: 1 addition & 1 deletion b/‎pyproject.toml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎sentinel/services/moderation.py‎
Lines changed: 28 additions & 14 deletions b/‎sentinel/services/moderation.py‎
Lines changed: 28 additions & 14 deletions
diff --git a/‎sentinel/utils/discord.py‎
Lines changed: 76 additions & 0 deletions b/‎sentinel/utils/discord.py‎
Lines changed: 76 additions & 0 deletions
@@ -5,31 +5,30 @@ on:
         branches: [main]
 
 jobs:
-    # test:
-    #     runs-on: ubuntu-latest
-    #     steps:
-    #         - name: Checkout
-    #           uses: actions/checkout@v4
+    test:
+        runs-on: ubuntu-latest
+        steps:
+            - name: Checkout
+              uses: actions/checkout@v4
 
-    #         - name: Setup pnpm
-    #           uses: pnpm/action-setup@v4
-    #           with:
-    #               version: 9
+            - name: Install uv
+              uses: astral-sh/setup-uv@v5
+              with:
+                  enable-cache: true
 
-    #         - name: Setup Node.js
-    #           uses: actions/setup-node@v4
-    #           with:
-    #               node-version: 20
-    #               cache: "pnpm"
+            - name: Set up Python
+              uses: actions/setup-python@v5
+              with:
+                  python-version: "3.10"
 
-    #         - name: Install dependencies
-    #           run: pnpm install
+            - name: Install dependencies
+              run: uv sync --extra dev
 
-    #         - name: Run tests
-    #           run: pnpm test
+            - name: Run tests
+              run: uv run pytest -v
 
     release-please:
-        # needs: test
+        needs: test
         runs-on: ubuntu-latest
         permissions:
             contents: write
 
@@ -0,0 +1,142 @@
+# Message Splitting
+
+## Overview
+
+Discord enforces a maximum message length of 2,000 characters per message. When the bot generates responses that exceed this limit, the message splitting feature automatically divides the content into multiple messages while maintaining readability.
+
+## Architecture Decision
+
+**Decision**: Implement automatic message splitting at the message sending layer
+
+**Rationale**:
+
+- **User Experience**: Long responses should be delivered completely rather than truncated
+- **Transparency**: Multiple messages maintain the bot's complete thought process
+- **Natural Boundaries**: Smart splitting at paragraphs, sentences, or words maintains context
+- **Automatic**: No LLM intervention required - handled at the infrastructure level
+
+**Date**: 2025-10-24
+
+## How It Works
+
+### Split Algorithm
+
+The message splitting utility (`sentinel/utils/discord.py`) uses a hierarchical approach to find natural split points:
+
+1. **First Priority - Paragraph Boundaries**: Splits at newlines (`\n`) if found in the latter half of the allowed length
+2. **Second Priority - Sentence Boundaries**: Splits after a period that is followed by a space or newline, if no good newline exists (the period must also fall in the latter half of the allowed length)
+3. **Third Priority - Word Boundaries**: Splits at spaces to avoid breaking words
+4. **Last Resort**: Hard splits at the character limit (rare, only for very long words/URLs)
+
+### Message Sending Behavior
+
+When `send_message` is called with content exceeding 2,000 characters:
+
+1. Content is split into chunks using the smart splitting algorithm
+2. Each chunk is sent as a separate message in sequence
+3. Only the first message uses the reply reference (if provided)
+4. All messages are recorded for analytics and conversation tracking
+5. The last message is used as the conversation continuation point
+
+### Example
+
+```python
+# Input: 3,500 character message
+long_message = "Lorem ipsum dolor sit amet.\n" * 125  # 28 characters x 125 = 3,500 characters
+
+# Output: 2 messages
+# Message 1: ~2,000 characters (split at paragraph)
+# Message 2: ~1,500 characters (remaining content)
+```
+
+## Implementation Details
+
+### Key Components
+
+1. **`sentinel/utils/discord.py:split_message()`**
+
+   - Core splitting logic
+   - Configurable max length (defaults to 2,000)
+   - Returns list of message chunks
+
+2. **`sentinel/services/moderation.py:_tool_send_message()`**
+   - Calls `split_message()` before sending
+   - Sends each chunk sequentially
+   - Handles reply references and threading for split messages
+
+### Edge Cases Handled
+
+- **Empty chunks**: Whitespace is stripped at each split point and any chunk that ends up empty is skipped, so no empty messages are sent
+- **Single word longer than limit**: Falls back to hard split (extremely rare)
+- **Code blocks**: May be split mid-block (future enhancement: preserve code blocks)
+- **Mentions/formatting**: Preserved across splits (Discord handles this automatically)
+
+## Configuration
+
+No configuration is required - message splitting is automatic and always enabled.
+
+### Constants
+
+- `DISCORD_MAX_MESSAGE_LENGTH = 2000` (defined in `sentinel/utils/discord.py`)
+- Can be adjusted if Discord changes their limits
+
+## Testing
+
+The splitting algorithm can be tested independently:
+
+```python
+from sentinel.utils.discord import split_message
+
+# Test short message (no split needed)
+assert split_message("Hello") == ["Hello"]
+
+# Test long message (requires split)
+long_msg = "a" * 3000
+chunks = split_message(long_msg)
+assert len(chunks) == 2
+assert all(len(chunk) <= 2000 for chunk in chunks)
+
+# Test natural boundaries
+paragraph_msg = ("Paragraph 1.\n" * 100) + ("Paragraph 2.\n" * 100)
+chunks = split_message(paragraph_msg)
+# Should split at paragraph boundaries
+```
+
+## Future Enhancements
+
+1. **Code Block Preservation**: Detect triple-backtick code blocks and avoid splitting inside them
+2. **Embed Support**: Handle embeds differently (embeds have different length limits)
+3. **Continuation Indicators**: Add "..." or "(continued)" markers between split messages
+4. **Smart Numbering**: For list-based responses, ensure lists aren't split awkwardly
+
+## Related Documentation
+
+- [Architecture Overview](./Architecture%20Overview.md) - Overall bot architecture
+- [Heuristics System](./Heuristics%20System.md) - How bot learns patterns
+- Discord API Limits: https://discord.com/developers/docs/resources/channel#create-message
+
+## Troubleshooting
+
+### Messages are being cut off mid-sentence
+
+This shouldn't happen with the current implementation, but if it does:
+
+1. Check if the message contains very long paragraphs (>1000 characters) with no natural boundaries
+2. Verify the split algorithm is finding sentence/word boundaries correctly
+3. Add logging to see where splits are occurring
+
+### Bot is sending too many messages
+
+If the bot is generating excessively long responses (multiple splits):
+
+1. Consider adjusting the system prompt to encourage more concise responses
+2. Review the LLM's output to understand why it's generating such long content
+3. This is working as intended - the alternative is truncation
+
+### Split messages lose context
+
+The split algorithm preserves all visible content - no truncation occurs; only the whitespace at each split point is trimmed. If context appears lost:
+
+1. Verify the conversation manager is tracking the last message correctly
+2. Check that reply references are working for the first chunk
+3. Ensure threading behavior is correct for multi-message responses
@@ -28,4 +28,4 @@ select = ["E", "F", "B", "I"]
 ignore = ["E203", "E501"]
 
 [project.optional-dependencies]
-dev = ["black>=23.10.0", "ruff>=0.1.5"]
+dev = ["black>=23.10.0", "ruff>=0.1.5", "pytest>=7.4.0"]
@@ -1072,27 +1072,41 @@ async def _tool_send_message(
             except AttributeError:
                 reference = None
 
-        try:
-            sent_message = await send_channel.send(message_content, reference=reference)
-        except discord.Forbidden:
-            logger.warning("Insufficient permissions to send message in %s", send_channel)
-            return
-        except discord.HTTPException:
-            logger.exception("Failed to send message in %s", send_channel)
-            return
+        # Split message if it exceeds Discord's character limit
+        from ..utils.discord import split_message
+
+        message_chunks = split_message(message_content)
+
+        # Send all message chunks
+        sent_messages: List[discord.Message] = []
+        for i, chunk in enumerate(message_chunks):
+            # Only use reference for the first message
+            chunk_reference = reference if i == 0 else None
+
+            try:
+                sent_message = await send_channel.send(chunk, reference=chunk_reference)
+                sent_messages.append(sent_message)
+            except discord.Forbidden:
+                logger.warning("Insufficient permissions to send message in %s", send_channel)
+                return
+            except discord.HTTPException:
+                logger.exception("Failed to send message in %s", send_channel)
+                return
 
-        # Record bot's response in conversation if we have one
-        if conversation_id and self._conversations:
-            await self._conversations.record_bot_response(conversation_id, sent_message)
+        # Record bot's response in conversation if we have one (use the last message)
+        if conversation_id and self._conversations and sent_messages:
+            await self._conversations.record_bot_response(conversation_id, sent_messages[-1])
 
         # Record channel activity for analytics (not logged as an action since this is just a reply)
+        # Record activity for each sent message
         channel_for_log = (
             send_channel if isinstance(send_channel, discord.abc.GuildChannel) else resolved_channel
         )
         if isinstance(channel_for_log, discord.abc.GuildChannel):
-            await self._record_bot_channel_activity(
-                guild, channel_for_log, sent_message, context_tag
-            )
+            for sent_msg in sent_messages:
+                await self._record_bot_channel_activity(
+                    guild, channel_for_log, sent_msg, context_tag
+                )
 
     async def _tool_escalate(self, args: Dict[str, Any], context: EventContext) -> None:
         summary = args.get("summary")
 
@@ -0,0 +1,76 @@
+"""Discord-specific utility functions."""
+
+from __future__ import annotations
+
+from typing import List
+
+# Discord's maximum message length
+DISCORD_MAX_MESSAGE_LENGTH = 2000
+
+
+def _find_split_point(text: str, max_length: int) -> int:
+    """Return the index at which ``text`` should be cut for the next chunk.
+
+    Boundaries are tried in priority order: newline, sentence end, space. A
+    boundary is accepted only if it lies past the halfway point of
+    ``max_length``; otherwise the next kind of boundary is tried. If none
+    qualifies, the cut falls back to a hard split at ``max_length``.
+
+    Args:
+        text: Text still to be split; must be longer than ``max_length``.
+        max_length: Maximum length of the chunk being cut (at least 1).
+
+    Returns:
+        An index in ``1..max_length``; the chunk is ``text[:index]``.
+    """
+    # Boundaries at or before the halfway point would produce needlessly short chunks.
+    half = max_length // 2
+
+    # 1. Paragraph boundary: cut just after the last newline in the window.
+    newline_pos = text.rfind("\n", half + 1, max_length)
+    if newline_pos != -1:
+        return newline_pos + 1
+
+    # 2. Sentence boundary: last period followed by a space or newline. The
+    #    search window ends one character later so the character *after* a
+    #    period at index ``max_length - 1`` can be inspected.
+    sentence_pos = max(
+        text.rfind(". ", half + 1, max_length + 1),
+        text.rfind(".\n", half + 1, max_length + 1),
+    )
+    if sentence_pos != -1:
+        return sentence_pos + 1
+
+    # 3. Word boundary: cut just after the last space in the window. This is
+    #    tried even when the window contains periods that are not sentence
+    #    ends (e.g. "v1.0" or a URL), so words are not broken needlessly.
+    space_pos = text.rfind(" ", half + 1, max_length)
+    if space_pos != -1:
+        return space_pos + 1
+
+    # 4. Last resort: hard split at the limit (very long word or URL).
+    return max_length
+
+
+def split_message(content: str, max_length: int = DISCORD_MAX_MESSAGE_LENGTH) -> List[str]:
+    """Split a message into chunks that fit within Discord's character limit.
+
+    Messages are split at natural boundaries (newlines, then sentence ends,
+    then spaces) found in the latter half of the allowed length, falling back
+    to a hard split when no such boundary exists. Whitespace on either side of
+    a split point is trimmed and chunks that end up empty are dropped.
+
+    Args:
+        content: The message content to split
+        max_length: Maximum length per chunk (default: 2000 for Discord)
+
+    Returns:
+        List of message chunks, each at most max_length characters. Content
+        that already fits is returned unchanged as a single-element list. The
+        list can be empty if content is longer than max_length and consists
+        only of whitespace.
+
+    Raises:
+        ValueError: If max_length is less than 1 (no chunk could make progress).
+
+    Examples:
+        >>> split_message("Short message")
+        ['Short message']
+
+        >>> long_msg = "a" * 3000
+        >>> chunks = split_message(long_msg)
+        >>> len(chunks)
+        2
+        >>> all(len(chunk) <= 2000 for chunk in chunks)
+        True
+    """
+    if max_length < 1:
+        # A non-positive limit can never consume input and would loop forever.
+        raise ValueError("max_length must be at least 1")
+
+    if len(content) <= max_length:
+        return [content]
+
+    chunks: List[str] = []
+    remaining = content
+
+    while len(remaining) > max_length:
+        split_point = _find_split_point(remaining, max_length)
+
+        # Trim whitespace at the cut so chunks neither end nor start with it
+        chunk = remaining[:split_point].rstrip()
+        if chunk:  # Only add non-empty chunks
+            chunks.append(chunk)
+
+        remaining = remaining[split_point:].lstrip()
+
+    # Whatever is left fits in a single message
+    if remaining:
+        chunks.append(remaining)
+
+    return chunks