Merged
Changes from all commits (36 commits)
d5c837a
non-breaking:
HendrikStrobelt Sep 24, 2025
1917b40
non-breaking:
HendrikStrobelt Sep 24, 2025
484ccf4
Context, SimpleContext, ChatContext (nee:LinearContext)
HendrikStrobelt Sep 24, 2025
a14b422
expand -> add
HendrikStrobelt Sep 25, 2025
2df9fbe
remove RootContext in favor of _is_root attribute.
HendrikStrobelt Sep 25, 2025
2fe2e79
.
HendrikStrobelt Sep 25, 2025
89428c9
actions_for_available_tools is back
HendrikStrobelt Sep 25, 2025
6359b41
all backends adjusted to new context structure.
HendrikStrobelt Sep 25, 2025
e64b51b
feat: add top level funcs and start sample changes
jakelorocco Sep 25, 2025
f3e9137
context adjustments and tests
HendrikStrobelt Sep 25, 2025
c9ec7df
maybe breaking:
HendrikStrobelt Sep 25, 2025
3646edf
untested session and sampling changes
HendrikStrobelt Sep 25, 2025
c2b3c47
backends should add ACTION and MOT.
HendrikStrobelt Sep 25, 2025
a47dae8
as_chat_history adapted
HendrikStrobelt Sep 25, 2025
849a7ed
fix: ollama client instantiate to prevent stale event loops in httpx …
jakelorocco Sep 26, 2025
c3854f4
fix: mypy issues
jakelorocco Sep 26, 2025
0754a5d
Renaming:
HendrikStrobelt Sep 26, 2025
590a285
name cleanup
HendrikStrobelt Sep 26, 2025
e494305
adding contexts to sampling
HendrikStrobelt Sep 26, 2025
d0f6633
1) handling sampling results and context
HendrikStrobelt Sep 26, 2025
5e005bd
adding warning
HendrikStrobelt Sep 26, 2025
b94809b
name clarity
HendrikStrobelt Sep 26, 2025
9a2efbf
remove unnecessary function
HendrikStrobelt Sep 26, 2025
507d10c
updated tests:
HendrikStrobelt Sep 26, 2025
ede690e
fix: watsonx errors
jakelorocco Sep 26, 2025
4afa7cf
fix: sampling and vision tests
jakelorocco Sep 26, 2025
09a34b6
examples react - error to be looked into by @JAL
HendrikStrobelt Sep 26, 2025
3ca56a3
fixed react - thanks to @JAL
HendrikStrobelt Sep 26, 2025
597332c
examples for alora (untested) and gen slots (tested)
HendrikStrobelt Sep 26, 2025
6a137f4
more examples updated
HendrikStrobelt Sep 26, 2025
5b11c5c
more examples updated
HendrikStrobelt Sep 26, 2025
81446e9
remove old context
HendrikStrobelt Sep 26, 2025
f483afa
fix: best of n and misc changes
jakelorocco Sep 27, 2025
09a50b2
fix: improve runtime of best of n sampling
jakelorocco Sep 27, 2025
5fbf63e
fix: add tests
jakelorocco Sep 27, 2025
d1c7fb5
fix: remove references to LinearContext
jakelorocco Sep 29, 2025
6 changes: 3 additions & 3 deletions docs/examples/aLora/101_example.py
@@ -1,10 +1,10 @@
 import time

-from mellea import LinearContext, MelleaSession
+from mellea import MelleaSession
 from mellea.backends.aloras.huggingface.granite_aloras import HFConstraintAlora
 from mellea.backends.cache import SimpleLRUCache
 from mellea.backends.huggingface import LocalHFBackend
-from mellea.stdlib.base import GenerateLog
+from mellea.stdlib.base import ChatContext, GenerateLog
 from mellea.stdlib.requirement import ALoraRequirement, Requirement

 # Define a backend and add the constraint aLora
@@ -22,7 +22,7 @@
 backend.add_alora(custom_stembolt_failure_constraint)

 # Create M session
-m = MelleaSession(backend, ctx=LinearContext())
+m = MelleaSession(backend, ctx=ChatContext())

 # define a requirement
 failure_check = ALoraRequirement(
16 changes: 9 additions & 7 deletions docs/examples/agents/react.py
@@ -2,7 +2,7 @@
 import inspect
 import json
 from collections.abc import Callable
-from typing import Literal, Unpack
+from typing import Literal

 import pydantic
 from jinja2 import Template
@@ -13,6 +13,7 @@
 import mellea.stdlib
 import mellea.stdlib.base
 import mellea.stdlib.chat
+from mellea.stdlib.base import ChatContext

 react_system_template: Template = Template(
     """Answer the user's question as best you can.
@@ -83,7 +84,7 @@ def call_tool(self, tool: ReactTool, kwargs_json: str):
     def tool_name_schema(self):
         names = self.tool_names()
         fields = dict()
-        fields["tool"] = Literal[Unpack[names]]
+        fields["tool"] = Literal[*names]
         return pydantic.create_model("ToolSelectionSchema", **fields)

     def get_tool_from_schema(self, content: str):
@@ -103,7 +104,7 @@ def react(
     react_toolbox: ReactToolbox,
 ):
     assert m.ctx.is_chat_context, "ReACT requires a chat context."
-    test_ctx_lin = m.ctx.render_for_generation()
+    test_ctx_lin = m.ctx.view_for_generation()
     assert test_ctx_lin is not None and len(test_ctx_lin) == 0, (
         "ReACT expects a fresh context."
    )
@@ -114,8 +115,9 @@
     )

     # Add the system prompt and the goal to the chat history.
-    m.ctx.insert(mellea.stdlib.chat.Message(role="system", content=_sys_prompt))
-    m.ctx.insert(mellea.stdlib.chat.Message(role="user", content=f"{goal}"))
+    m.ctx = m.ctx.add(
+        mellea.stdlib.chat.Message(role="system", content=_sys_prompt)
+    ).add(mellea.stdlib.chat.Message(role="user", content=f"{goal}"))

     # The main ReACT loop as a dynamic program:
     # ( ?(not done) ;
@@ -156,7 +158,7 @@ def react(

         print("### Observation")
         tool_output = react_toolbox.call_tool(selected_tool, act_args.content)
-        m.ctx.insert(mellea.stdlib.chat.Message(role="tool", content=tool_output))
+        m.ctx = m.ctx.add(mellea.stdlib.chat.Message(role="tool", content=tool_output))
         print(tool_output)

         print("### Done Check")
@@ -178,7 +180,7 @@ def react(


 if __name__ == "__main__":
-    m = mellea.start_session(ctx=mellea.stdlib.base.LinearContext())
+    m = mellea.start_session(ctx=ChatContext())

     def zip_lookup_tool_fn(city: str):
         """Returns the ZIP code for the `city`."""
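
Both ReACT examples also swap `Literal[Unpack[names]]` for the star-unpacking form `Literal[*names]`, which Python 3.11+ accepts directly in subscript position. A self-contained sketch of the dynamic tool-selection schema this builds (the tool names are hypothetical, and the field is written in the `(annotation, default)` tuple form that pydantic's `create_model` accepts):

```python
from typing import Literal

import pydantic

names = ("zip_lookup", "weather")  # hypothetical tool names

# Constrain the `tool` field to exactly the registered tool names.
ToolSelectionSchema = pydantic.create_model(
    "ToolSelectionSchema", tool=(Literal[*names], ...)
)

print(ToolSelectionSchema(tool="weather"))  # ok
# ToolSelectionSchema(tool="subway")        # would raise a ValidationError
```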
16 changes: 9 additions & 7 deletions docs/examples/agents/react_instruct.py
@@ -2,7 +2,7 @@
 import inspect
 import json
 from collections.abc import Callable
-from typing import Literal, Unpack
+from typing import Literal

 import pydantic
 from jinja2 import Template
@@ -11,6 +11,7 @@
 import mellea.stdlib
 import mellea.stdlib.base
 import mellea.stdlib.chat
+from mellea.stdlib.base import ChatContext

 react_system_template: Template = Template(
     """Answer the user's question as best you can.
@@ -81,7 +82,7 @@ def call_tool(self, tool: ReactTool, kwargs_json: str):
     def tool_name_schema(self):
         names = self.tool_names()
         fields = dict()
-        fields["tool"] = Literal[Unpack[names]]
+        fields["tool"] = Literal[*names]
         return pydantic.create_model("ToolSelectionSchema", **fields)

     def get_tool_from_schema(self, content: str):
@@ -101,7 +102,7 @@ def react(
     react_toolbox: ReactToolbox,
 ):
     assert m.ctx.is_chat_context, "ReACT requires a chat context."
-    test_ctx_lin = m.ctx.render_for_generation()
+    test_ctx_lin = m.ctx.view_for_generation()
     assert test_ctx_lin is not None and len(test_ctx_lin) == 0, (
         "ReACT expects a fresh context."
    )
@@ -112,8 +113,9 @@
     )

     # Add the system prompt and the goal to the chat history.
-    m.ctx.insert(mellea.stdlib.chat.Message(role="system", content=_sys_prompt))
-    m.ctx.insert(mellea.stdlib.chat.Message(role="user", content=f"{goal}"))
+    m.ctx = m.ctx.add(
+        mellea.stdlib.chat.Message(role="system", content=_sys_prompt)
+    ).add(mellea.stdlib.chat.Message(role="user", content=f"{goal}"))

     # The main ReACT loop as a dynamic program:
     # ( ?(not done) ;
@@ -159,7 +161,7 @@ def react(

         print("### Observation")
         tool_output = react_toolbox.call_tool(selected_tool, act_args_val)
-        m.ctx.insert(mellea.stdlib.chat.Message(role="tool", content=tool_output))
+        m.ctx = m.ctx.add(mellea.stdlib.chat.Message(role="tool", content=tool_output))
         print(tool_output)

         print("### Done Check")
@@ -187,7 +189,7 @@ def react(


 if __name__ == "__main__":
-    m = mellea.start_session(ctx=mellea.stdlib.base.LinearContext())
+    m = mellea.start_session(ctx=ChatContext())

     def zip_lookup_tool_fn(city: str):
         """Returns the ZIP code for the `city`."""
10 changes: 5 additions & 5 deletions docs/examples/generative_slots/generate_with_context.py
@@ -1,6 +1,6 @@
-from mellea import LinearContext, generative, start_session
+from mellea import generative, start_session
 from mellea.backends.types import ModelOption
-from mellea.stdlib.base import CBlock
+from mellea.stdlib.base import CBlock, ChatContext

 # Generative slots can be used with sessions that have context.
 # By utilizing context, you can change the results of several
@@ -34,7 +34,7 @@ def give_feedback(essay: str) -> list[str]:

 if __name__ == "__main__":
     m = start_session(
-        ctx=LinearContext(), model_options={ModelOption.MAX_NEW_TOKENS: 100}
+        ctx=ChatContext(), model_options={ModelOption.MAX_NEW_TOKENS: 100}
     )

     text = """
@@ -55,7 +55,7 @@ def give_feedback(essay: str) -> list[str]:

     # If you have a set of generative functions, you can tweak them all by
     # adding context to the session they are running in.
-    m.ctx.insert(
+    m.ctx = m.ctx.add(
         CBlock(
             "You are an elementary school teacher. "
             "Any grades and feedback that you give should keep that in mind. Remember to be "
@@ -74,7 +74,7 @@ def give_feedback(essay: str) -> list[str]:

     # And, let's reset the context and try a different grading style.
     m.reset()
-    m.ctx.insert(
+    m.ctx = m.ctx.add(
         CBlock(
             "You are a grammarian that is focused solely on spelling and syntax, "
             "not on the content of essays. When giving grades and feedback, focus "
2 changes: 1 addition & 1 deletion docs/examples/helper/__init__.py
@@ -1 +1 @@
-from .helpers import Any, fill, w
+from .helpers import req_print, w
7 changes: 7 additions & 0 deletions docs/examples/helper/helpers.py
@@ -1,7 +1,14 @@
 from textwrap import fill
 from typing import Any

+from mellea.stdlib.requirement import Requirement, ValidationResult
+

 # Just for printing stuff nicely...
 def w(x: Any) -> str:
     return fill(str(x), width=120, replace_whitespace=False)
+
+
+def req_print(rv_list: list[tuple[Requirement, ValidationResult]]) -> str:
+    parts = [f"{bool(rv[1])}\t: {rv[0].description}" for rv in rv_list]
+    return "\n".join(parts)
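
For reference, a usage sketch for the new `req_print` helper. The pairs below are hypothetical: `req_print` only needs `bool(result)` and `requirement.description`, so plain booleans stand in for `ValidationResult` (whose constructor is not shown in this PR), and the `Requirement("...")` call assumes the description is the first positional argument:

```python
from docs.examples.helper import req_print
from mellea.stdlib.requirement import Requirement

rv_list = [
    (Requirement("be formal"), True),  # hypothetical stand-in results
    (Requirement("Use 'Dear interns' as greeting."), False),
]
print(req_print(rv_list))
# True  : be formal
# False : Use 'Dear interns' as greeting.
```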
8 changes: 4 additions & 4 deletions docs/examples/image_text_models/vision_ollama_chat.py
@@ -2,11 +2,11 @@

 from PIL import Image

-from mellea import LinearContext, start_session
-from mellea.stdlib.base import ImageBlock
+from mellea import start_session
+from mellea.stdlib.base import ChatContext, ImageBlock

-m = start_session(model_id="granite3.2-vision", ctx=LinearContext())
-# m = start_session(model_id="llava", ctx=LinearContext())
+m = start_session(model_id="granite3.2-vision", ctx=ChatContext())
+# m = start_session(model_id="llava", ctx=ChatContext())

 # load image
 test_img = Image.open("pointing_up.jpg")
15 changes: 2 additions & 13 deletions docs/examples/instruct_validate_repair/101_email.py
@@ -1,30 +1,19 @@
 # This is the 101 example for using `session` and `instruct`.
 # helper function to wrap text
 from docs.examples.helper import w
-from mellea import instruct, start_session
+from mellea import start_session
 from mellea.backends.types import ModelOption

 # create a session using Granite 3.3 8B on Ollama and a simple context [see below]
-with start_session(model_options={ModelOption.MAX_NEW_TOKENS: 200}):
-    # write an email
-    email_v1 = instruct("Write an email to invite all interns to the office party.")
-
+with start_session(model_options={ModelOption.MAX_NEW_TOKENS: 200}) as m:
+    # write an email
+    email_v1 = m.instruct("Write an email to invite all interns to the office party.")
+    print(m.last_prompt())

 # print result
 print(f"***** email ****\n{w(email_v1)}\n*******")

 # ************** END *************
-
-
-# # optionally: print the debug log for the last instruction on the context
-# from mellea.stdlib.base import GenerateLog
-# _, log = m.ctx.last_output_and_logs()
-# if isinstance(log, GenerateLog): # should be
-#     print(f"Prompt:\n{w(log.prompt)}") # print prompt

 # # start_session() is equivalent to:
 # from mellea.backends import model_ids
 # from mellea.backends.ollama import OllamaModelBackend
@@ -5,7 +5,7 @@
 # create a session using Granite 3.3 8B on Ollama and a simple context [see below]
 m = start_session(model_options={ModelOption.MAX_NEW_TOKENS: 200})

-# write an email
+# write an email with automatic requirement checking.
 email_v1 = m.instruct(
     "Write an email to invite all interns to the office party.",
     requirements=["be formal", "Use 'Dear interns' as greeting."],
18 changes: 14 additions & 4 deletions docs/examples/instruct_validate_repair/101_email_with_validate.py
@@ -1,19 +1,29 @@
-from docs.examples.helper import w
+from docs.examples.helper import req_print, w
 from mellea import start_session
 from mellea.backends.types import ModelOption
 from mellea.stdlib.sampling import RejectionSamplingStrategy

 # create a session using Granite 3.3 8B on Ollama and a simple context [see below]
 m = start_session(model_options={ModelOption.MAX_NEW_TOKENS: 200})

-email_v1 = m.instruct(
+email_v2_samples = m.instruct(
     "Write an email to invite all interns to the office party.",
     requirements=["be formal", "Use 'Dear interns' as greeting."],
+    strategy=RejectionSamplingStrategy(loop_budget=3),
+    return_sampling_results=True,
 )

-# print result
-print(f"***** email ****\n{w(email_v1)}\n*******")
+if email_v2_samples.success:
+    print(f"Success: \n{w(email_v2_samples.result)}")
+    print(
+        f"===> Requirement for this sample: \n{req_print(email_v2_samples.sample_validations[-1])}"
+    )
+else:
+    print(f"Failure: \n{w(email_v2_samples.result)}")
+    selected_index = email_v2_samples.sample_generations.index(email_v2_samples.result)
+    print(
+        f"===> Requirement for this sample: \n{req_print(email_v2_samples.sample_validations[selected_index])}"
+    )

 # # [optional] get logs for all loops:
 # from mellea.stdlib.base import GenerateLog
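
The two branches above differ only in how they locate the validation set for the returned sample. A compact equivalent, sketched against the attribute names visible in this diff (`success`, `result`, `sample_generations`, `sample_validations`):

```python
# Sketch: on success the result is the accepted (last) generation; on
# failure it is whichever sample the strategy fell back to. Indexing the
# generations list recovers the matching validations in either case.
def validations_for_result(samples):
    idx = samples.sample_generations.index(samples.result)
    return samples.sample_validations[idx]

# print(req_print(validations_for_result(email_v2_samples)))
```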
2 changes: 1 addition & 1 deletion docs/examples/mify/rich_document_advanced.py
@@ -9,7 +9,7 @@
 from mellea.stdlib.base import ModelOutputThunk, TemplateRepresentation

 # Use a `SimpleContext` so that each LLM call is independent.
-m = mellea.start_session(backend_name="hf", ctx=mellea.SimpleContext())
+m = mellea.start_session(backend_name="hf")

 # 2. Let's import docling so that we can process pdf documents.

7 changes: 4 additions & 3 deletions docs/examples/notebooks/context_example.ipynb
@@ -71,7 +71,7 @@
    "source": [
     "## Import Mellea and Start a Session with LinearContext\n",
     "\n",
-    "Up to this point we have used SimpleContext, a context manager that resets the chat message history on each model call. That is, the model's context is entirely determined by the current Component. \n",
+    "Up to this point we have used SimpleContext, a context manager that resets the chat message history on each model call. That is, the model's context is entirely determined by the current Component.\n",
     "\n",
     "Mellea also provides a LinearContext, which behaves like a chat history. We will use the LinearContext to interact with chat models:"
    ]
@@ -84,9 +84,10 @@
    },
    "outputs": [],
    "source": [
-    "from mellea import LinearContext, start_session\n",
+    "from mellea import start_session\n",
+    "from mellea.stdlib.base import ChatContext\n",
     "\n",
-    "m = start_session(ctx=LinearContext())\n",
+    "m = start_session(ctx=ChatContext())\n",
     "m.chat(\"Make up a math problem.\")\n",
     "m.chat(\"Solve your math problem.\")\n",
     "print(m.ctx.last_output())\n",
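
Note that the surrounding markdown cells still use the old `LinearContext` name, while the code now uses `ChatContext`. For readers following the notebook, the behavioral contrast it describes can be sketched as follows (assuming `SimpleContext` remains the session default, as the `rich_document_advanced.py` change above suggests):

```python
from mellea import start_session
from mellea.stdlib.base import ChatContext

# SimpleContext (default): each call starts from a clean history.
m = start_session()
m.chat("Make up a math problem.")
# A follow-up chat here would not see the problem above.

# ChatContext: turns accumulate like a chat history.
m2 = start_session(ctx=ChatContext())
m2.chat("Make up a math problem.")
m2.chat("Solve your math problem.")  # sees the prior turn
print(m2.ctx.last_output())
```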
4 changes: 2 additions & 2 deletions docs/examples/notebooks/m_serve_example.ipynb
@@ -83,11 +83,11 @@
     "\n",
     "import mellea\n",
     "from cli.serve.models import ChatMessage\n",
-    "from mellea.stdlib.base import LinearContext, ModelOutputThunk\n",
+    "from mellea.stdlib.base import ChatContext, ModelOutputThunk\n",
     "from mellea.stdlib.requirement import Requirement, simple_validate\n",
     "from mellea.stdlib.sampling import RejectionSamplingStrategy, SamplingResult\n",
     "\n",
-    "session = mellea.start_session(ctx=LinearContext())\n",
+    "session = mellea.start_session(ctx=ChatContext())\n",
     "\n",
     "\n",
     "def validate_hi_bob(email: str) -> bool:\n",
8 changes: 3 additions & 5 deletions docs/examples/safety.py/guardian.py
@@ -2,9 +2,8 @@

 from mellea import MelleaSession
 from mellea.backends import model_ids
-from mellea.backends.dummy import DummyBackend
 from mellea.backends.ollama import OllamaModelBackend
-from mellea.stdlib.base import Context, ContextTurn, ModelOutputThunk, SimpleContext
+from mellea.stdlib.base import ContextTurn, ModelOutputThunk
 from mellea.stdlib.chat import Message
 from mellea.stdlib.safety.guardian import GuardianCheck, GuardianRisk

@@ -25,10 +24,9 @@
 print("\n Test 2\n")

 # create a mean conversation and add to context
-m.ctx.insert_turn(
-    ContextTurn(Message("user", "Hello. "), ModelOutputThunk("You are very ugly."))
+m.ctx = m.ctx.add(Message("user", "Hello. ")).add(
+    ModelOutputThunk("You are very ugly.")
 )

 # show last turn in chat
 print(f"Context: {m.ctx.last_turn()}")

4 changes: 2 additions & 2 deletions docs/examples/sessions/creating_a_new_type_of_session.py
@@ -3,7 +3,7 @@
 from mellea import MelleaSession
 from mellea.backends import Backend, BaseModelSubclass
 from mellea.backends.ollama import OllamaModelBackend
-from mellea.stdlib.base import CBlock, Context, LinearContext, ModelOutputThunk
+from mellea.stdlib.base import CBlock, ChatContext, Context, ModelOutputThunk
 from mellea.stdlib.chat import Message
 from mellea.stdlib.requirement import Requirement, reqify
 from mellea.stdlib.safety.guardian import GuardianCheck, GuardianRisk
@@ -66,7 +66,7 @@ def chat(
 m = ChatCheckingSession(
     requirements=[GuardianCheck("jailbreak"), GuardianCheck("profanity")],
     backend=OllamaModelBackend(),
-    ctx=LinearContext(),
+    ctx=ChatContext(),
 )

 # You can run this code to see the immediate checks working.
7 changes: 4 additions & 3 deletions docs/examples/tutorial/context_example.py
@@ -1,9 +1,10 @@
-from mellea import LinearContext, start_session
+from mellea import start_session
+from mellea.stdlib.base import ChatContext

-m = start_session(ctx=LinearContext())
+m = start_session(ctx=ChatContext())
 m.chat("Make up a math problem.")
 m.chat("Solve your math problem.")

 print(m.ctx.last_output())

 print("==================")
 print(m.ctx.last_turn())