fix: JsonPlusRedisSerializer

keenborder786 · keenborder786 · commit 77054cba8325 · 2025-10-23T00:27:59.000+05:00
diff --git a/langgraph/checkpoint/redis/jsonplus_redis.py b/langgraph/checkpoint/redis/jsonplus_redis.py
@@ -40,6 +40,15 @@ class JsonPlusRedisSerializer(JsonPlusSerializer):
 
     def dumps(self, obj: Any) -> bytes:
         """Use orjson for simple objects, fallback to parent for complex objects."""
+        try:
+            # Check if this is an Interrupt object that needs special handling
+            from langgraph.types import Interrupt
+            if isinstance(obj, Interrupt):
+                # Serialize Interrupt as a constructor format for proper deserialization
+                return super().dumps(obj)
+        except ImportError:
+            pass
+        
         try:
             # Fast path: Use orjson for JSON-serializable objects
             return orjson.dumps(obj)
@@ -66,6 +75,10 @@ def _revive_if_needed(self, obj: Any) -> Any:
         reconstructed. Without this, messages would remain as dictionaries with
         'lc', 'type', and 'constructor' fields, causing errors when the application
         expects actual message objects with 'role' and 'content' attributes.
+        
+        This also handles Interrupt objects that may be stored as plain dictionaries
+        with 'value' and 'id' keys, reconstructing them as proper Interrupt instances
+        to prevent AttributeError when accessing the 'id' attribute.
 
         Args:
             obj: The object to potentially revive, which may be a dict, list, or primitive.
@@ -80,6 +93,24 @@ def _revive_if_needed(self, obj: Any) -> Any:
                 # This converts {'lc': 1, 'type': 'constructor', ...} back to
                 # the actual LangChain object (e.g., HumanMessage, AIMessage)
                 return self._reviver(obj)
+            
+            # Check if this looks like an Interrupt object stored as a plain dict
+            # Interrupt objects have 'value' and 'id' keys, and possibly nothing else
+            # We need to be careful not to accidentally convert other dicts
+            if (
+                "value" in obj
+                and "id" in obj
+                and len(obj) == 2
+                and isinstance(obj.get("id"), str)
+            ):
+                # Try to reconstruct as an Interrupt object
+                try:
+                    from langgraph.types import Interrupt
+                    return Interrupt(value=obj["value"], id=obj["id"])
+                except (ImportError, TypeError, ValueError):
+                    # If we can't import or construct Interrupt, fall through
+                    pass
+            
             # Recursively process nested dicts
             return {k: self._revive_if_needed(v) for k, v in obj.items()}
         elif isinstance(obj, list):
diff --git a/tests/test_interrupt_serialization_fix.py b/tests/test_interrupt_serialization_fix.py
@@ -0,0 +1,334 @@
+"""Test for Interrupt serialization fix (GitHub Issue #33556).
+
+This test verifies that Interrupt objects are properly serialized and deserialized
+by the JsonPlusRedisSerializer, preventing the AttributeError that occurs when
+code tries to access the 'id' attribute on what it expects to be an Interrupt
+object but is actually a plain dictionary.
+
+Issue: https://github.com/langchain-ai/langchain/issues/33556
+"""
+
+import asyncio
+import json
+import uuid
+from typing import Any
+
+import pytest
+from langchain_core.runnables import RunnableConfig
+from langgraph.checkpoint.base import Checkpoint, CheckpointMetadata
+from langgraph.types import Interrupt, interrupt
+
+from langgraph.checkpoint.redis import RedisSaver
+from langgraph.checkpoint.redis.aio import AsyncRedisSaver
+from langgraph.checkpoint.redis.jsonplus_redis import JsonPlusRedisSerializer
+
+
+class TestInterruptSerialization:
+    """Test suite for Interrupt object serialization and deserialization."""
+
+    def test_interrupt_direct_serialization(self):
+        """Test that Interrupt objects are properly serialized and deserialized."""
+        serializer = JsonPlusRedisSerializer()
+        
+        # Create an Interrupt object
+        interrupt_obj = Interrupt(
+            value={"tool_name": "external_action", "message": "Need approval"},
+            id="test-interrupt-123"
+        )
+        
+        # Test serialization/deserialization
+        serialized = serializer.dumps(interrupt_obj)
+        deserialized = serializer.loads(serialized)
+        
+        # Verify it's an Interrupt object with the correct attributes
+        assert isinstance(deserialized, Interrupt), f"Expected Interrupt, got {type(deserialized)}"
+        assert hasattr(deserialized, 'id'), "Deserialized object should have 'id' attribute"
+        assert deserialized.id == "test-interrupt-123", f"ID mismatch: {deserialized.id}"
+        assert deserialized.value == {"tool_name": "external_action", "message": "Need approval"}
+
+    def test_interrupt_constructor_format(self):
+        """Test that Interrupt objects are serialized in LangChain constructor format."""
+        serializer = JsonPlusRedisSerializer()
+        
+        interrupt_obj = Interrupt(
+            value={"data": "test"},
+            id="constructor-test-id"
+        )
+        
+        serialized = serializer.dumps(interrupt_obj)
+        
+        # Parse the JSON to check the format
+        parsed = json.loads(serialized)
+        assert parsed.get("lc") == 2, "Should have lc=2 for constructor format"
+        assert parsed.get("type") == "constructor", "Should have type=constructor"
+        assert parsed.get("id") == ["langgraph", "types", "Interrupt"], "Should have correct id path"
+        assert "kwargs" in parsed, "Should have kwargs field"
+        assert parsed["kwargs"]["id"] == "constructor-test-id"
+
+    def test_plain_dict_reconstruction(self):
+        """Test that plain dicts with value/id keys are reconstructed as Interrupt objects."""
+        serializer = JsonPlusRedisSerializer()
+        
+        # This simulates what happens when Interrupt is stored as plain dict
+        plain_dict_interrupt = {"value": {"data": "test"}, "id": "plain-id"}
+        serialized = serializer.dumps(plain_dict_interrupt)
+        deserialized = serializer.loads(serialized)
+        
+        # Should be reconstructed as an Interrupt
+        assert isinstance(deserialized, Interrupt), f"Expected Interrupt, got {type(deserialized)}"
+        assert hasattr(deserialized, 'id'), "Should have 'id' attribute"
+        assert deserialized.id == "plain-id", f"ID should be preserved: {deserialized.id}"
+        assert deserialized.value == {"data": "test"}
+
+    def test_nested_interrupt_in_list(self):
+        """Test Interrupt serialization in nested structures like pending_writes."""
+        serializer = JsonPlusRedisSerializer()
+        
+        # Simulate pending_writes structure
+        interrupt_obj = Interrupt(value={"interrupt": "data"}, id="nested-id")
+        nested_data = [
+            ("task1", interrupt_obj),
+            ("task2", {"regular": "dict"})
+        ]
+        
+        serialized = serializer.dumps(nested_data)
+        deserialized = serializer.loads(serialized)
+        
+        # Verify the Interrupt in the nested structure
+        assert len(deserialized) == 2
+        task1_value = deserialized[0][1]
+        task2_value = deserialized[1][1]
+        
+        assert isinstance(task1_value, Interrupt), "task1 should have Interrupt"
+        assert task1_value.id == "nested-id"
+        assert isinstance(task2_value, dict), "task2 should remain dict"
+
+    def test_plain_dict_in_nested_structure(self):
+        """Test that plain dicts with value/id in nested structures are reconstructed."""
+        serializer = JsonPlusRedisSerializer()
+        
+        # Simulate the problematic case from the issue
+        nested_structure = [
+            ("task1", {"value": {"interrupt": "data"}, "id": "interrupt-1"}),
+            ("task2", {"normal": "dict", "no": "conversion"}),
+        ]
+        
+        serialized = serializer.dumps(nested_structure)
+        deserialized = serializer.loads(serialized)
+        
+        task1_value = deserialized[0][1]
+        task2_value = deserialized[1][1]
+        
+        # task1 should be reconstructed as Interrupt
+        assert isinstance(task1_value, Interrupt), f"task1 should have Interrupt, got {type(task1_value)}"
+        assert task1_value.id == "interrupt-1"
+        # This is the line that would fail in the original bug
+        interrupt_id = task1_value.id  # Should not raise AttributeError
+        assert interrupt_id == "interrupt-1"
+        
+        # task2 should remain a dict
+        assert isinstance(task2_value, dict), f"task2 should remain dict, got {type(task2_value)}"
+
+    def test_edge_cases_not_converted(self):
+        """Test that dicts that shouldn't be converted to Interrupt remain as dicts."""
+        serializer = JsonPlusRedisSerializer()
+        
+        # Dict with non-string id - should not convert
+        non_string_id = {"value": "test", "id": 123}
+        result = serializer.loads(serializer.dumps(non_string_id))
+        assert isinstance(result, dict), "Should not convert when id is not string"
+        
+        # Dict with extra fields - should not convert
+        extra_fields = {"value": "test", "id": "test-id", "extra": "field"}
+        result = serializer.loads(serializer.dumps(extra_fields))
+        assert isinstance(result, dict), "Should not convert when extra fields present"
+        
+        # Dict with only value - should not convert
+        only_value = {"value": "test"}
+        result = serializer.loads(serializer.dumps(only_value))
+        assert isinstance(result, dict), "Should not convert with only value field"
+        
+        # Dict with only id - should not convert
+        only_id = {"id": "test-id"}
+        result = serializer.loads(serializer.dumps(only_id))
+        assert isinstance(result, dict), "Should not convert with only id field"
+
+    def test_complex_interrupt_value(self):
+        """Test Interrupt with complex nested value structures."""
+        serializer = JsonPlusRedisSerializer()
+        
+        complex_value = {
+            "tool_name": "external_action",
+            "tool_args": {
+                "name": "Foo",
+                "config": {"timeout": 30, "retries": 3},
+                "nested": {"deep": {"structure": ["a", "b", "c"]}}
+            },
+            "metadata": {"timestamp": "2024-01-01", "user_id": "user123"}
+        }
+        
+        interrupt_obj = Interrupt(value=complex_value, id="complex-id")
+        
+        serialized = serializer.dumps(interrupt_obj)
+        deserialized = serializer.loads(serialized)
+        
+        assert isinstance(deserialized, Interrupt)
+        assert deserialized.id == "complex-id"
+        assert deserialized.value == complex_value
+        assert deserialized.value["tool_args"]["nested"]["deep"]["structure"] == ["a", "b", "c"]
+
+
+@pytest.mark.asyncio
+class TestInterruptSerializationAsync:
+    """Async tests for Interrupt serialization with Redis checkpointers."""
+
+    async def test_interrupt_in_checkpoint_async(self, redis_url: str):
+        """Test that Interrupt objects in checkpoints are properly handled."""
+        async with AsyncRedisSaver.from_conn_string(redis_url) as checkpointer:
+            thread_id = f"test-interrupt-{uuid.uuid4()}"
+            config = {
+                "configurable": {
+                    "thread_id": thread_id,
+                    "checkpoint_ns": "",
+                    "checkpoint_id": str(uuid.uuid4()),
+                }
+            }
+            
+            # Create an Interrupt object
+            interrupt_obj = Interrupt(
+                value={
+                    "tool_name": "external_action",
+                    "tool_args": {"name": "TestArg"},
+                    "message": "Need external system call",
+                },
+                id="async-interrupt-id"
+            )
+            
+            # Create checkpoint with Interrupt in pending_writes
+            checkpoint = {
+                "v": 1,
+                "ts": "2024-01-01T00:00:00+00:00",
+                "id": config["configurable"]["checkpoint_id"],
+                "channel_values": {"messages": ["test message"]},
+                "channel_versions": {},
+                "versions_seen": {},
+                "pending_writes": [
+                    ("interrupt_task", interrupt_obj),
+                ],
+            }
+            
+            metadata = {"source": "test", "step": 1, "writes": {}}
+            
+            # Save the checkpoint
+            await checkpointer.aput(config, checkpoint, metadata, {})
+            
+            # Retrieve the checkpoint
+            checkpoint_tuple = await checkpointer.aget_tuple(config)
+            
+            assert checkpoint_tuple is not None
+            
+            # Verify pending_writes contains an Interrupt object
+            assert len(checkpoint_tuple.pending_writes) == 1
+            task_id, value = checkpoint_tuple.pending_writes[0]
+            
+            assert task_id == "interrupt_task"
+            assert isinstance(value, Interrupt), f"Expected Interrupt, got {type(value)}"
+            assert hasattr(value, 'id'), "Should have 'id' attribute"
+            assert value.id == "async-interrupt-id"
+            
+            # This simulates the code that was failing in the issue
+            # It should not raise AttributeError
+            pending_interrupts = {}
+            for task_id, val in checkpoint_tuple.pending_writes:
+                if isinstance(val, Interrupt):
+                    pending_interrupts[task_id] = val.id
+            
+            assert pending_interrupts == {"interrupt_task": "async-interrupt-id"}
+
+    async def test_multiple_interrupts_async(self, redis_url: str):
+        """Test handling multiple Interrupt objects in a checkpoint."""
+        async with AsyncRedisSaver.from_conn_string(redis_url) as checkpointer:
+            thread_id = f"test-multi-interrupt-{uuid.uuid4()}"
+            config = {
+                "configurable": {
+                    "thread_id": thread_id,
+                    "checkpoint_ns": "",
+                    "checkpoint_id": str(uuid.uuid4()),
+                }
+            }
+            
+            # Create multiple Interrupts
+            interrupts = [
+                ("task1", Interrupt(value={"action": "approve"}, id="interrupt-1")),
+                ("task2", Interrupt(value={"action": "deny"}, id="interrupt-2")),
+                ("task3", {"regular": "dict", "not": "interrupt"}),
+                ("task4", Interrupt(value={"action": "retry"}, id="interrupt-3")),
+            ]
+            
+            checkpoint = {
+                "v": 1,
+                "ts": "2024-01-01T00:00:00+00:00",
+                "id": config["configurable"]["checkpoint_id"],
+                "channel_values": {},
+                "channel_versions": {},
+                "versions_seen": {},
+                "pending_writes": interrupts,
+            }
+            
+            metadata = {"source": "test", "step": 1}
+            
+            await checkpointer.aput(config, checkpoint, metadata, {})
+            checkpoint_tuple = await checkpointer.aget_tuple(config)
+            
+            assert checkpoint_tuple is not None
+            assert len(checkpoint_tuple.pending_writes) == 4
+            
+            # Verify each item
+            for i, (task_id, value) in enumerate(checkpoint_tuple.pending_writes):
+                if task_id in ["task1", "task2", "task4"]:
+                    assert isinstance(value, Interrupt), f"{task_id} should have Interrupt"
+                    assert hasattr(value, 'id')
+                    # Verify we can access the id without error
+                    _ = value.id
+                elif task_id == "task3":
+                    assert isinstance(value, dict), "task3 should remain dict"
+
+
+class TestInterruptSerializationSync:
+    """Sync tests for Interrupt serialization with Redis checkpointers."""
+
+    def test_interrupt_with_empty_value(self):
+        """Test Interrupt with None or empty value."""
+        serializer = JsonPlusRedisSerializer()
+        
+        # Interrupt with None value
+        interrupt_none = Interrupt(value=None, id="none-value-id")
+        result = serializer.loads(serializer.dumps(interrupt_none))
+        assert isinstance(result, Interrupt)
+        assert result.value is None
+        assert result.id == "none-value-id"
+        
+        # Interrupt with empty dict value
+        interrupt_empty = Interrupt(value={}, id="empty-value-id")
+        result = serializer.loads(serializer.dumps(interrupt_empty))
+        assert isinstance(result, Interrupt)
+        assert result.value == {}
+        assert result.id == "empty-value-id"
+
+    def test_backwards_compatibility(self):
+        """Test that the fix doesn't break existing non-Interrupt data."""
+        serializer = JsonPlusRedisSerializer()
+        
+        # Various data types that should work as before
+        test_cases = [
+            {"message": "regular dict", "type": "test"},
+            ["list", "of", "strings"],
+            {"nested": {"structure": {"with": ["mixed", "types", 123]}}},
+            {"value": "has value key but not id"},
+            {"id": "has id key but not value"},
+            {"value": 123, "id": "non-string-value", "extra": "field"},
+        ]
+        
+        for original in test_cases:
+            result = serializer.loads(serializer.dumps(original))
+            assert result == original, f"Data should be unchanged: {original}"