OpenHands
diff --git a/‎.openhands/skills/code-review.md‎ ‎.agents/skills/code-review.md‎.openhands/skills/code-review.md renamed to .agents/skills/code-review.md
Lines changed: 4 additions & 1 deletion b/‎.openhands/skills/code-review.md‎ ‎.agents/skills/code-review.md‎.openhands/skills/code-review.md renamed to .agents/skills/code-review.md
Lines changed: 4 additions & 1 deletion
diff --git a/‎…ls/debug-test-examples-workflow/SKILL.md‎ ‎…ls/debug-test-examples-workflow/SKILL.md‎.openhands/skills/debug-test-examples-workflow/SKILL.md renamed to .agents/skills/debug-test-examples-workflow/SKILL.md b/‎…ls/debug-test-examples-workflow/SKILL.md‎ ‎…ls/debug-test-examples-workflow/SKILL.md‎.openhands/skills/debug-test-examples-workflow/SKILL.md renamed to .agents/skills/debug-test-examples-workflow/SKILL.md
diff --git a/‎.openhands/skills/run-eval.md‎ ‎.agents/skills/run-eval.md‎.openhands/skills/run-eval.md renamed to .agents/skills/run-eval.md b/‎.openhands/skills/run-eval.md‎ ‎.agents/skills/run-eval.md‎.openhands/skills/run-eval.md renamed to .agents/skills/run-eval.md
diff --git a/‎.openhands/skills/write-behavior-test.md‎ ‎.agents/skills/write-behavior-test.md‎.openhands/skills/write-behavior-test.md renamed to .agents/skills/write-behavior-test.md b/‎.openhands/skills/write-behavior-test.md‎ ‎.agents/skills/write-behavior-test.md‎.openhands/skills/write-behavior-test.md renamed to .agents/skills/write-behavior-test.md
diff --git a/‎.github/run-eval/resolve_model_config.py‎
Lines changed: 7 additions & 0 deletions b/‎.github/run-eval/resolve_model_config.py‎
Lines changed: 7 additions & 0 deletions
diff --git a/‎.github/workflows/pr-review-by-openhands.yml‎
Lines changed: 6 additions & 5 deletions b/‎.github/workflows/pr-review-by-openhands.yml‎
Lines changed: 6 additions & 5 deletions
diff --git a/‎.github/workflows/server.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/server.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.github/workflows/todo-management.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/todo-management.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎AGENTS.md‎
Lines changed: 19 additions & 0 deletions b/‎AGENTS.md‎
Lines changed: 19 additions & 0 deletions
diff --git a/‎examples/01_standalone_sdk/38_browser_session_recording.py‎
Lines changed: 178 additions & 0 deletions b/‎examples/01_standalone_sdk/38_browser_session_recording.py‎
Lines changed: 178 additions & 0 deletions
@@ -15,9 +15,11 @@ You have permission to **APPROVE** or **COMMENT** on PRs. Do not use REQUEST_CHA
 
 **Default to APPROVE**: If your review finds no issues at "important" level or higher, approve the PR. Minor suggestions or nitpicks alone are not sufficient reason to withhold approval.
 
+**IMPORTANT: If you determine a PR is worth merging, you should approve it.** Don't just say a PR is "worth merging" or "ready to merge" without actually submitting an approval. Your words and actions should be consistent.
+
 ### When to APPROVE
 
-Approve PRs that are straightforward and low-risk:
+Examples of straightforward and low-risk PRs you should approve (non-exhaustive):
 
 - **Configuration changes**: Adding models to config files, updating CI/workflow settings
 - **CI/Infrastructure changes**: Changing runner types, fixing workflow paths, updating job configurations
@@ -70,6 +72,7 @@ Do not leave comments for:
 - **Good behavior observed**: Don't comment just to praise code that follows best practices - this adds noise. Simply approve if the code is good.
 - **Suggestions for additional tests on simple changes**: For straightforward PRs (config changes, model additions, etc.), don't suggest adding test coverage unless tests are clearly missing for new logic
 - **Obvious or self-explanatory code**: Don't ask for comments on code that is already clear
+- **`.pr/` directory artifacts**: Files in the `.pr/` directory are temporary PR-specific documents (design notes, analysis, scripts) that are automatically cleaned up when the PR is approved. Do not comment on their presence or suggest removing them.
 
 If a PR is approvable, just approve it. Don't add "one small suggestion" or "consider doing X" comments that delay merging without adding real value.
 
 
@@ -145,6 +145,13 @@
             "disable_vision": True,
         },
     },
+    "glm-5": {
+        "id": "glm-5",
+        "display_name": "GLM-5",
+        "llm_config": {
+            "model": "litellm_proxy/openrouter/z-ai/glm-5",
+        },
+    },
     "qwen3-coder-next": {
         "id": "qwen3-coder-next",
         "display_name": "Qwen3 Coder Next",
 
@@ -8,7 +8,8 @@ on:
     #   2. A draft PR is marked as ready for review, OR
     #   3. A maintainer adds the 'review-this' label, OR
     #   4. A maintainer requests openhands-agent or all-hands-bot as a reviewer
-    # Only users with write access can add labels or request reviews, ensuring security.
+    # Adding labels and requesting new reviewers requires write access. GitHub may also allow PR authors
+    # to re-request review from a previous reviewer.
     # The PR code is explicitly checked out for review, but secrets are only accessible
     # because the workflow runs in the base repository context
     pull_request_target:
@@ -22,14 +23,14 @@ permissions:
 jobs:
     pr-review:
         # Run when one of the following conditions is met:
-        #   1. A new non-draft PR is opened by a trusted contributor, OR
-        #   2. A draft PR is converted to ready for review by a trusted contributor, OR
+        #   1. A new non-draft PR is opened by an author whose association is neither FIRST_TIME_CONTRIBUTOR nor NONE, OR
+        #   2. A draft PR is converted to ready for review by an author whose association is neither FIRST_TIME_CONTRIBUTOR nor NONE, OR
         #   3. 'review-this' label is added, OR
         #   4. openhands-agent or all-hands-bot is requested as a reviewer
         # Note: PRs whose author_association is FIRST_TIME_CONTRIBUTOR or NONE require a manual trigger via label/reviewer request
         if: |
-            (github.event.action == 'opened' && github.event.pull_request.draft == false && github.event.pull_request.author_association != 'FIRST_TIME_CONTRIBUTOR') ||
-            (github.event.action == 'ready_for_review' && github.event.pull_request.author_association != 'FIRST_TIME_CONTRIBUTOR') ||
+            (github.event.action == 'opened' && github.event.pull_request.draft == false && github.event.pull_request.author_association != 'FIRST_TIME_CONTRIBUTOR' && github.event.pull_request.author_association != 'NONE') ||
+            (github.event.action == 'ready_for_review' && github.event.pull_request.author_association != 'FIRST_TIME_CONTRIBUTOR' && github.event.pull_request.author_association != 'NONE') ||
             github.event.label.name == 'review-this' ||
             github.event.requested_reviewer.login == 'openhands-agent' ||
             github.event.requested_reviewer.login == 'all-hands-bot'
 
@@ -708,7 +708,7 @@ jobs:
                       echo 'EOF'
                   } >> $GITHUB_OUTPUT
 
-            - name: Update PR description with comprehensive docker information
+            - name: Update PR description with docker image details
               uses: nefrob/pr-description@v1.2.0
               with:
                   content: ${{ steps.generate_description.outputs.pr_content }}
 
@@ -219,7 +219,7 @@ jobs:
                   echo "Available files:"
                   ls -la
 
-                  # Run the agent with comprehensive logging
+                  # Run the agent with detailed logging
                   echo "Starting agent execution..."
                   set +e  # Don't exit on error, we want to capture it
                   uv run python agent.py "$TODO_JSON" 2>&1 | tee agent_output.log
 
@@ -116,6 +116,10 @@ When reviewing code, provide constructive feedback:
 - If it is a single-line string, you can break it into a multi-line string by doing "ABC" -> ("A"\n"B"\n"C")
 - If it is a long multi-line string (e.g., docstring), you should just add type ignore AFTER the ending """. You should NEVER ADD IT INSIDE the docstring.
 
+# PyInstaller Data Files
+
+When adding non-Python files (JS, templates, etc.) loaded at runtime, add them to `openhands-agent-server/openhands/agent_server/agent-server.spec` using `collect_data_files`.
+
 </DEV_SETUP>
 
 <PR_ARTIFACTS>
@@ -280,6 +284,21 @@ git push -u origin <feature-name>
 ```
 </DOCUMENTATION_WORKFLOW>
 
+<AGENT_TMP_DIRECTORY>
+# Agent Temporary Directory Convention
+
+When tools need to store observation files (e.g., browser session recordings, task tracker data), use `.agent_tmp` as the directory name for consistency.
+
+The browser session recording tool saves recordings to `.agent_tmp/observations/recording-{timestamp}/`.
+
+This convention ensures tool-generated observation files are stored in a predictable location that can be easily:
+- Added to `.gitignore`
+- Cleaned up after agent sessions
+- Identified as agent-generated artifacts
+
+Note: This is separate from `persistence_dir` which is used for conversation state persistence.
+</AGENT_TMP_DIRECTORY>
+
 <REPO>
 <PROJECT_STRUCTURE>
 - `openhands-sdk/` core SDK; `openhands-tools/` built-in tools; `openhands-workspace/` workspace management; `openhands-agent-server/` server runtime; `examples/` runnable patterns; `tests/` split by domain (`tests/sdk`, `tests/tools`, `tests/agent_server`, etc.).
 
@@ -0,0 +1,178 @@
+"""Browser Session Recording Example
+
+This example demonstrates how to use the browser session recording feature
+to capture and save a recording of the agent's browser interactions using rrweb.
+
+The recording can be replayed later using rrweb-player to visualize the agent's
+browsing session.
+
+The recording will be automatically saved under BROWSER_RECORDING_OUTPUT_DIR
+(in a `recording-{timestamp}/` subdirectory) when browser_stop_recording is
+called. You can replay it with:
+    - rrweb-player: https://github.com/rrweb-io/rrweb/tree/master/packages/rrweb-player
+    - Online viewer: https://www.rrweb.io/demo/
+"""
+
+import json
+import os
+
+from pydantic import SecretStr
+
+from openhands.sdk import (
+    LLM,
+    Agent,
+    Conversation,
+    Event,
+    LLMConvertibleEvent,
+    get_logger,
+)
+from openhands.sdk.tool import Tool
+from openhands.tools.browser_use import BrowserToolSet
+from openhands.tools.browser_use.definition import BROWSER_RECORDING_OUTPUT_DIR
+
+
+logger = get_logger(__name__)
+
+# Configure LLM
+# LLM_API_KEY is required; LLM_MODEL falls back to the default below and
+# LLM_BASE_URL stays None when the variable is unset.
+api_key = os.getenv("LLM_API_KEY")
+assert api_key is not None, "LLM_API_KEY environment variable is not set."
+model = os.getenv("LLM_MODEL", "anthropic/claude-sonnet-4-5-20250929")
+base_url = os.getenv("LLM_BASE_URL")
+llm = LLM(
+    usage_id="agent",
+    model=model,
+    base_url=base_url,
+    api_key=SecretStr(api_key),
+)
+
+# Tools - including browser tools with recording capability
+cwd = os.getcwd()  # passed to the conversation below as its workspace
+tools = [
+    Tool(name=BrowserToolSet.name),
+]
+
+# Agent
+agent = Agent(llm=llm, tools=tools)
+
+# Filled by conversation_callback; only its length is reported at the end.
+llm_messages = []  # collect raw LLM messages
+
+
+def conversation_callback(event: Event):
+    if isinstance(event, LLMConvertibleEvent):
+        llm_messages.append(event.to_llm_message())
+
+
+# Create the conversation. persistence_dir holds conversation state; the
+# browser recordings themselves are read back from BROWSER_RECORDING_OUTPUT_DIR
+# further down, not from this directory.
+conversation = Conversation(
+    agent=agent,
+    callbacks=[conversation_callback],
+    workspace=cwd,
+    persistence_dir="./.conversations",
+)
+
+# The prompt instructs the agent to:
+# 1. Start recording the browser session
+# 2. Browse to a website and perform some actions
+# 3. Stop recording (auto-saves to file)
+PROMPT = """
+Please complete the following task to demonstrate browser session recording:
+
+1. First, use `browser_start_recording` to begin recording the browser session.
+
+2. Then navigate to https://docs.openhands.dev/ and:
+   - Get the page content
+   - Scroll down the page
+   - Get the browser state to see interactive elements
+
+3. Next, navigate to https://docs.openhands.dev/openhands/usage/cli/installation and:
+   - Get the page content
+   - Scroll down to see more content
+
+4. Finally, use `browser_stop_recording` to stop the recording.
+   Events are automatically saved.
+"""
+
+print("=" * 80)
+print("Browser Session Recording Example")
+print("=" * 80)
+print("\nTask: Record an agent's browser session and save it for replay")
+print("\nStarting conversation with agent...\n")
+
+# Queue the prompt, then run the conversation before inspecting the output.
+conversation.send_message(PROMPT)
+conversation.run()
+
+print("\n" + "=" * 80)
+print("Conversation finished!")
+print("=" * 80)
+
+# Check if the recording files were created
+# Recordings are saved in BROWSER_RECORDING_OUTPUT_DIR/recording-{timestamp}/
+if os.path.exists(BROWSER_RECORDING_OUTPUT_DIR):
+    # Find recording subdirectories (they start with "recording-")
+    recording_dirs = sorted(
+        [
+            d
+            for d in os.listdir(BROWSER_RECORDING_OUTPUT_DIR)
+            if d.startswith("recording-")
+            and os.path.isdir(os.path.join(BROWSER_RECORDING_OUTPUT_DIR, d))
+        ]
+    )
+
+    if recording_dirs:
+        # Process the most recent recording directory
+        latest_recording = recording_dirs[-1]
+        recording_path = os.path.join(BROWSER_RECORDING_OUTPUT_DIR, latest_recording)
+        json_files = sorted(
+            [f for f in os.listdir(recording_path) if f.endswith(".json")]
+        )
+
+        print(f"\n✓ Recording saved to: {recording_path}")
+        print(f"✓ Number of files: {len(json_files)}")
+
+        # Count total events across all files
+        total_events = 0
+        all_event_types: dict[int | str, int] = {}
+        total_size = 0
+
+        for json_file in json_files:
+            filepath = os.path.join(recording_path, json_file)
+            file_size = os.path.getsize(filepath)
+            total_size += file_size
+
+            with open(filepath) as f:
+                events = json.load(f)
+
+            # Events are stored as a list in each file
+            if isinstance(events, list):
+                total_events += len(events)
+                for event in events:
+                    event_type = event.get("type", "unknown")
+                    all_event_types[event_type] = all_event_types.get(event_type, 0) + 1
+
+            print(f"  - {json_file}: {len(events)} events, {file_size} bytes")
+
+        print(f"✓ Total events: {total_events}")
+        print(f"✓ Total size: {total_size} bytes")
+        if all_event_types:
+            print(f"✓ Event types: {all_event_types}")
+
+        print("\nTo replay this recording, you can use:")
+        print(
+            "  - rrweb-player: "
+            "https://github.com/rrweb-io/rrweb/tree/master/packages/rrweb-player"
+        )
+    else:
+        print(f"\n✗ No recording directories found in: {BROWSER_RECORDING_OUTPUT_DIR}")
+        print("  The agent may not have completed the recording task.")
+else:
+    print(f"\n✗ Observations directory not found: {BROWSER_RECORDING_OUTPUT_DIR}")
+    print("  The agent may not have completed the recording task.")
+
+print("\n" + "=" * 100)
+print("Conversation finished.")
+print(f"Total LLM messages: {len(llm_messages)}")
+print("=" * 100)
+
+# Report cost
+cost = conversation.conversation_stats.get_combined_metrics().accumulated_cost
+print(f"Conversation ID: {conversation.id}")
+print(f"EXAMPLE_COST: {cost}")