24 changes: 24 additions & 0 deletions README.md
@@ -175,6 +175,8 @@ Options:
- `--dry-run` - show what would be converted without creating files
- `--open` - open the generated archive in your default browser
- `-q, --quiet` - suppress all output except errors
- `-m, --merge` - merge with existing archive (preserve orphan sessions)
- `--prefix NAME` - prefix for sessions in index (e.g., machine name)

Examples:

@@ -192,6 +194,28 @@ claude-code-transcripts all -o ./my-archive
claude-code-transcripts all --include-agents
```

### Merging archives from multiple machines

Use `-m`/`--merge` to combine sessions from different machines into a single archive:

```bash
# Machine A: create initial archive
claude-code-transcripts all -o /shared/archive

# Machine B: merge additional sessions
claude-code-transcripts all -o /shared/archive -m

# With prefix (shown in index)
claude-code-transcripts all -o /shared/archive --merge --prefix=laptop
```

The `--merge` option:
- Regenerates all sessions found in the source directory
- Preserves "orphan" sessions in the archive that are no longer in the source
- Useful for maintaining a unified archive from multiple machines

The `--prefix` option adds a label to sessions in the index, helping identify which machine they came from.
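
The same merge behaviour is also reachable from Python through `generate_batch_html()` (extended in this change with `merge` and `prefix` parameters). A minimal sketch, assuming `~/.claude/projects` is where your local Claude Code sessions live:

```python
from pathlib import Path

from claude_code_transcripts import generate_batch_html

# Assumed location of the local Claude Code projects folder; adjust as needed.
source = Path.home() / ".claude" / "projects"

stats = generate_batch_html(
    source,
    "/shared/archive",
    merge=True,       # keep orphan sessions already present in the archive
    prefix="laptop",  # label these sessions in the generated index
)
print(f"{stats['total_sessions']} sessions across {stats['total_projects']} projects")
```

The returned dict also carries `failed_sessions` and `output_dir`, mirroring what the CLI reports.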

## Development

To contribute to this tool, first checkout the code. You can run the tests using `uv run`:
247 changes: 229 additions & 18 deletions src/claude_code_transcripts/__init__.py
@@ -303,8 +303,179 @@ def find_all_sessions(folder, include_agents=False):
return result


def find_existing_sessions(output_dir):
"""Find existing sessions in an output archive directory.

Scans the output directory structure to find already-generated sessions.
Returns a list of project dicts in the same format as find_all_sessions().

Args:
output_dir: Path to the archive directory (e.g., ./claude-archive)

Returns:
List of project dicts: [{"name": str, "path": None, "sessions": [...]}]
Session dicts contain: path (session dir), summary, mtime, size
"""
output_dir = Path(output_dir)
if not output_dir.exists():
return []

# Regex patterns to extract session info from project index HTML
session_pattern = re.compile(
r'<a href="([^"]+)/index\.html">\s*'
r'<div class="index-item-header">\s*'
r'<span class="index-item-number">([^<]+)</span>\s*'
r"<span[^>]*>([^<]+)</span>\s*"
r"</div>\s*"
r'<div class="index-item-content">\s*'
r"<p[^>]*>([^<]*)",
re.DOTALL,
)

projects = []

# Iterate over subdirectories (projects)
for project_dir in output_dir.iterdir():
if not project_dir.is_dir():
continue
# Skip if it's the master index.html in root
if project_dir.name == "index.html":
continue

project_index = project_dir / "index.html"
if not project_index.exists():
continue

# Parse project index HTML
html_content = project_index.read_text()
sessions = []

for match in session_pattern.finditer(html_content):
session_name = match.group(1)
# date = match.group(2) # Not used currently
# size_str = match.group(3) # e.g., "15 KB"
summary = match.group(4).strip()
# Handle truncated summaries (ending with ...)
if summary.endswith("..."):
summary = summary[:-3]

session_dir = project_dir / session_name
if not session_dir.exists() or not session_dir.is_dir():
continue

# Get mtime from session directory
try:
mtime = session_dir.stat().st_mtime
except OSError:
mtime = 0

# Calculate size as sum of HTML files in session
size = sum(
f.stat().st_size
for f in session_dir.iterdir()
if f.is_file() and f.suffix == ".html"
)

sessions.append(
{
"path": session_dir,
"summary": summary,
"mtime": mtime,
"size": size,
}
)

if sessions:
# Sort sessions by mtime (most recent first)
sessions.sort(key=lambda s: s["mtime"], reverse=True)
projects.append(
{
"name": project_dir.name,
"path": None, # No source path for existing sessions
"sessions": sessions,
}
)

# Sort projects by most recent session
projects.sort(
key=lambda p: p["sessions"][0]["mtime"] if p["sessions"] else 0, reverse=True
)

return projects


def merge_sessions(source_sessions, existing_sessions):
"""Merge sessions from source with existing archive.

All source sessions will be (re)generated.
Sessions only in existing archive are preserved in the merged index.

Args:
source_sessions: Projects from find_all_sessions() (new/updated)
existing_sessions: Projects from find_existing_sessions()

Returns:
merged_projects: Combined list for index generation (source + orphans)
"""
# Build lookup of existing sessions by (project_name, session_stem)
existing_lookup = {}
for project in existing_sessions:
for session in project["sessions"]:
# Get session stem (filename without extension for source, dir name for existing)
session_stem = (
session["path"].stem if session["path"].suffix else session["path"].name
)
existing_lookup[(project["name"], session_stem)] = session

# Build merged projects dict
merged = {}

# Add all source sessions (they will be regenerated)
for project in source_sessions:
project_name = project["name"]
if project_name not in merged:
merged[project_name] = {
"name": project_name,
"path": project.get("path"),
"sessions": [],
}

for session in project["sessions"]:
session_stem = session["path"].stem
# Remove from the existing lookup so this session is not treated as an orphan
existing_lookup.pop((project_name, session_stem), None)
merged[project_name]["sessions"].append(session)

# Add orphaned sessions (only in existing, not in source)
for (project_name, session_stem), session in existing_lookup.items():
if project_name not in merged:
merged[project_name] = {
"name": project_name,
"path": None,
"sessions": [],
}
merged[project_name]["sessions"].append(session)

# Sort sessions within each project by mtime (most recent first)
for project in merged.values():
project["sessions"].sort(key=lambda s: s["mtime"], reverse=True)

# Convert to list and sort projects by most recent session
result = list(merged.values())
result.sort(
key=lambda p: p["sessions"][0]["mtime"] if p["sessions"] else 0, reverse=True
)

return result
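
# Illustrative usage sketch (not part of this change): how the scans above compose.
# Source sessions win for anything present in both; sessions found only in the
# existing archive ("orphans") are kept so the regenerated index still links to them.
#
#     source_projects = find_all_sessions(source_folder)
#     existing_projects = find_existing_sessions(output_dir)
#     projects_for_index = merge_sessions(source_projects, existing_projects)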


def generate_batch_html(
source_folder, output_dir, include_agents=False, progress_callback=None
source_folder,
output_dir,
include_agents=False,
progress_callback=None,
merge=False,
prefix=None,
):
"""Generate HTML archive for all sessions in a Claude projects folder.

@@ -319,24 +490,39 @@ def generate_batch_html(
include_agents: Whether to include agent-* session files
progress_callback: Optional callback(project_name, session_name, current, total)
called after each session is processed
merge: If True, preserve orphan sessions from existing archive in the index
prefix: Optional prefix to display for sessions in the index (e.g., machine name)

Returns statistics dict with total_projects, total_sessions, failed_sessions, output_dir.
"""
source_folder = Path(source_folder)
output_dir = Path(output_dir)
output_dir.mkdir(parents=True, exist_ok=True)

# Find all sessions
projects = find_all_sessions(source_folder, include_agents=include_agents)
# Find all sessions from source
source_projects = find_all_sessions(source_folder, include_agents=include_agents)

# Add prefix to source sessions if specified
if prefix:
for project in source_projects:
for session in project["sessions"]:
session["prefix"] = prefix

# Calculate total for progress tracking
total_session_count = sum(len(p["sessions"]) for p in projects)
# Determine projects for index generation
if merge and output_dir.exists():
existing_projects = find_existing_sessions(output_dir)
projects_for_index = merge_sessions(source_projects, existing_projects)
else:
projects_for_index = source_projects

# Calculate total for progress tracking (only source sessions are generated)
total_session_count = sum(len(p["sessions"]) for p in source_projects)
processed_count = 0
successful_sessions = 0
failed_sessions = []

# Process each project
for project in projects:
# Process each source project (generate HTML for source sessions only)
for project in source_projects:
project_dir = output_dir / project["name"]
project_dir.mkdir(exist_ok=True)

@@ -366,14 +552,17 @@ def generate_batch_html(
project["name"], session_name, processed_count, total_session_count
)

# Generate project index
# Generate project indexes (using merged projects if applicable)
for project in projects_for_index:
project_dir = output_dir / project["name"]
project_dir.mkdir(exist_ok=True)
_generate_project_index(project, project_dir)

# Generate master index
_generate_master_index(projects, output_dir)
_generate_master_index(projects_for_index, output_dir)

return {
"total_projects": len(projects),
"total_projects": len(projects_for_index),
"total_sessions": successful_sessions,
"failed_sessions": failed_sessions,
"output_dir": output_dir,
@@ -388,14 +577,20 @@ def _generate_project_index(project, output_dir):
sessions_data = []
for session in project["sessions"]:
mod_time = datetime.fromtimestamp(session["mtime"])
sessions_data.append(
{
"name": session["path"].stem,
"summary": session["summary"],
"date": mod_time.strftime("%Y-%m-%d %H:%M"),
"size_kb": session["size"] / 1024,
}
# Get session name: stem for files, name for directories
session_name = (
session["path"].stem if session["path"].suffix else session["path"].name
)
session_entry = {
"name": session_name,
"summary": session["summary"],
"date": mod_time.strftime("%Y-%m-%d %H:%M"),
"size_kb": session["size"] / 1024,
}
# Add prefix if present
if "prefix" in session:
session_entry["prefix"] = session["prefix"]
sessions_data.append(session_entry)

html_content = template.render(
project_name=project["name"],
@@ -1927,7 +2122,21 @@ def web_cmd(
is_flag=True,
help="Suppress all output except errors.",
)
def all_cmd(source, output, include_agents, dry_run, open_browser, quiet):
@click.option(
"-m",
"--merge",
is_flag=True,
help="Merge with existing archive: regenerate source sessions, preserve orphans in index.",
)
@click.option(
"--prefix",
type=str,
default=None,
help="Prefix for sessions in index (e.g., --prefix=laptop).",
)
def all_cmd(
source, output, include_agents, dry_run, open_browser, quiet, merge, prefix
):
"""Convert all local Claude Code sessions to a browsable HTML archive.

Creates a directory structure with:
@@ -1993,6 +2202,8 @@ def on_progress(project_name, session_name, current, total):
output,
include_agents=include_agents,
progress_callback=on_progress,
merge=merge,
prefix=prefix,
)

# Report any failures
2 changes: 1 addition & 1 deletion src/claude_code_transcripts/templates/project_index.html
@@ -10,7 +10,7 @@ <h1><a href="../index.html" style="color: inherit; text-decoration: none;">Claud
<div class="index-item">
<a href="{{ session.name }}/index.html">
<div class="index-item-header">
<span class="index-item-number">{{ session.date }}</span>
<span class="index-item-number">{% if session.prefix %}<span style="color: var(--tool-border); font-weight: 600;">[{{ session.prefix }}]</span> {% endif %}{{ session.date }}</span>
<span style="color: var(--text-muted);">{{ "%.0f"|format(session.size_kb) }} KB</span>
</div>
<div class="index-item-content">