Merge pull request #80 from claytonlin1110/feat/batch-generation-manifest

dippatel1994 · web-flow · commit 90fb00903468 · 2026-03-09T10:36:15.000-04:00
feat: add batch generation from YAML/JSON manifest
diff --git a/README.md b/README.md
@@ -39,6 +39,7 @@ An agentic framework for generating publication-quality academic diagrams and st
 - Input optimization layer for better generation quality
 - Auto-refine mode and run continuation with user feedback
 - CLI, Python API, and MCP server for IDE integration
+- **Batch generation** from a manifest file (YAML/JSON) for multiple diagrams in one run
 - Claude Code skills for `/generate-diagram`, `/generate-plot`, and `/evaluate-diagram`
 
 <p align="center">
@@ -205,6 +206,39 @@ paperbanana plot \
 | `--output` | `-o` | Output image path |
 | `--iterations` | `-n` | Refinement iterations (default: 3) |
 
+### `paperbanana batch` -- Batch Generation
+
+Generate multiple methodology diagrams from a single manifest file (YAML or JSON). Each item runs the full pipeline; outputs are written under `outputs/batch_<id>/run_<id>/` and a `batch_report.json` summarizes all runs.
+
+```bash
+paperbanana batch --manifest examples/batch_manifest.yaml --optimize
+```
+
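+Manifest format (YAML or JSON): either an object with an `items` list, as below, or a bare top-level list of items. Each item requires `input` and `caption`; `id` is optional and defaults to `item_<n>`: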
+
+```yaml
+items:
+  - input: path/to/method1.txt
+    caption: "Overview of our encoder-decoder"
+    id: fig1
+  - input: method2.txt
+    caption: "Training pipeline"
+    id: fig2
+```
+
+Relative paths in the manifest are resolved against the manifest file's directory; absolute paths are used as-is.
+
+| Flag | Short | Description |
+|------|-------|-------------|
+| `--manifest` | `-m` | Path to manifest file (required) |
+| `--output-dir` | `-o` | Parent directory for batch run (default: outputs) |
+| `--config` | | Path to config YAML |
+| `--iterations` | `-n` | Refinement iterations per item |
+| `--optimize` | | Preprocess inputs for each item |
+| `--auto` | | Loop until critic satisfied per item |
+| `--format` | `-f` | Output image format (png, jpeg, webp) |
+| `--auto-download-data` | | Download expanded reference set if needed |
+
 ### `paperbanana evaluate` -- Quality Assessment
 
 Comparative evaluation of a generated diagram against a human reference using VLM-as-a-Judge:
diff --git a/examples/batch_manifest.yaml b/examples/batch_manifest.yaml
@@ -0,0 +1,11 @@
+# Batch manifest example: generate multiple methodology diagrams.
+# Paths are relative to this file's directory.
+# Run: paperbanana batch --manifest examples/batch_manifest.yaml
+
+items:
+  - input: sample_inputs/transformer_method.txt
+    caption: "Overview of the Transformer encoder-decoder architecture with multi-head attention"
+    id: transformer
+  - input: sample_inputs/mamba_method.txt
+    caption: "Mamba block with selective state space and gating"
+    id: mamba
diff --git a/paperbanana/cli.py b/paperbanana/cli.py
@@ -467,6 +467,189 @@ async def _critic_run(*a, **kw):
     console.print(f"  Run ID: [dim]{result.metadata.get('run_id', 'unknown')}[/dim]")
 
 
+@app.command()
+def batch(
+    manifest: str = typer.Option(
+        ..., "--manifest", "-m", help="Path to batch manifest (YAML or JSON)"
+    ),
+    output_dir: str = typer.Option(
+        "outputs",
+        "--output-dir",
+        "-o",
+        help="Parent directory for batch run (batch_<id> will be created here)",
+    ),
+    config: Optional[str] = typer.Option(None, "--config", help="Path to config YAML file"),
+    vlm_provider: Optional[str] = typer.Option(None, "--vlm-provider", help="VLM provider"),
+    vlm_model: Optional[str] = typer.Option(None, "--vlm-model", help="VLM model name"),
+    image_provider: Optional[str] = typer.Option(
+        None, "--image-provider", help="Image gen provider"
+    ),
+    image_model: Optional[str] = typer.Option(None, "--image-model", help="Image gen model name"),
+    iterations: Optional[int] = typer.Option(
+        None, "--iterations", "-n", help="Refinement iterations"
+    ),
+    auto: bool = typer.Option(
+        False, "--auto", help="Loop until critic satisfied (with safety cap)"
+    ),
+    max_iterations: Optional[int] = typer.Option(
+        None, "--max-iterations", help="Safety cap for --auto"
+    ),
+    optimize: bool = typer.Option(
+        False, "--optimize", help="Preprocess inputs for better generation"
+    ),
+    format: str = typer.Option(
+        "png", "--format", "-f", help="Output image format (png, jpeg, webp)"
+    ),
+    save_prompts: Optional[bool] = typer.Option(
+        None, "--save-prompts/--no-save-prompts", help="Save prompts per run"
+    ),
+    auto_download_data: bool = typer.Option(
+        False, "--auto-download-data", help="Auto-download reference set if needed"
+    ),
+    verbose: bool = typer.Option(False, "--verbose", "-v", help="Show detailed progress"),
+) -> None:
+    """Generate multiple methodology diagrams from a manifest file (YAML or JSON)."""
+    # NOTE: the docstring above doubles as the CLI help text, so it stays a one-liner.
+    #
+    # Flow: validate arguments -> load manifest -> build Settings from CLI overrides
+    # -> run one pipeline per manifest item -> write batch_report.json.
+    # A failure in one item is recorded in the report and never aborts the others.
+    if format not in ("png", "jpeg", "webp"):
+        console.print(f"[red]Error: Format must be png, jpeg, or webp. Got: {format}[/red]")
+        raise typer.Exit(1)
+
+    configure_logging(verbose=verbose)
+    manifest_path = Path(manifest)
+    if not manifest_path.exists():
+        console.print(f"[red]Error: Manifest not found: {manifest}[/red]")
+        raise typer.Exit(1)
+
+    from paperbanana.core.batch import generate_batch_id, load_batch_manifest
+    from paperbanana.core.utils import ensure_dir, save_json
+
+    try:
+        items = load_batch_manifest(manifest_path)
+    except (ValueError, FileNotFoundError, RuntimeError) as e:
+        console.print(f"[red]Error loading manifest: {e}[/red]")
+        raise typer.Exit(1) from e
+
+    batch_id = generate_batch_id()
+    batch_dir = Path(output_dir) / batch_id
+    ensure_dir(batch_dir)
+
+    # Only options the user actually supplied are forwarded, so values coming from
+    # the config file / environment are not clobbered by CLI defaults.
+    overrides = {"output_dir": str(batch_dir), "output_format": format}
+    if vlm_provider:
+        overrides["vlm_provider"] = vlm_provider
+    if vlm_model:
+        overrides["vlm_model"] = vlm_model
+    if image_provider:
+        overrides["image_provider"] = image_provider
+    if image_model:
+        overrides["image_model"] = image_model
+    if iterations is not None:
+        overrides["refinement_iterations"] = iterations
+    if auto:
+        overrides["auto_refine"] = True
+    if max_iterations is not None:
+        overrides["max_iterations"] = max_iterations
+    if optimize:
+        overrides["optimize_inputs"] = True
+    if save_prompts is not None:
+        overrides["save_prompts"] = save_prompts
+
+    if config:
+        settings = Settings.from_yaml(config, **overrides)
+    else:
+        from dotenv import load_dotenv
+
+        load_dotenv()
+        settings = Settings(**overrides)
+
+    if auto_download_data:
+        from paperbanana.data.manager import DatasetManager
+
+        dm = DatasetManager(cache_dir=settings.cache_dir)
+        if not dm.is_downloaded():
+            console.print("  [dim]Downloading expanded reference set...[/dim]")
+            try:
+                dm.download()
+            except Exception as e:
+                # Best effort: a failed download is reported and the batch continues.
+                console.print(f"  [yellow]Download failed: {e}, using built-in set[/yellow]")
+
+    console.print(
+        Panel.fit(
+            f"[bold]PaperBanana[/bold] — Batch Generation\n\n"
+            f"Manifest: {manifest_path.name}\n"
+            f"Items: {len(items)}\n"
+            f"Output: {batch_dir}",
+            border_style="blue",
+        )
+    )
+    console.print()
+
+    from paperbanana.core.pipeline import PaperBananaPipeline
+
+    def _failure_record(entry: dict, error: str) -> dict:
+        """Build the report record for an item that produced no output."""
+        return {
+            "id": entry["id"],
+            "input": entry["input"],
+            "caption": entry["caption"],
+            "run_id": None,
+            "output_path": None,
+            "error": error,
+        }
+
+    report = {"batch_id": batch_id, "manifest": str(manifest_path), "items": []}
+    total_start = time.perf_counter()
+
+    for idx, item in enumerate(items):
+        item_id = item["id"]
+        input_path = Path(item["input"])
+        if not input_path.exists():
+            console.print(f"[red]Skipping item '{item_id}': input not found: {input_path}[/red]")
+            report["items"].append(_failure_record(item, "input file not found"))
+            continue
+
+        console.print(f"[bold]Item {idx + 1}/{len(items)}[/bold] — {item_id}")
+        try:
+            # Reading the input and building the pipeline happen inside the try so
+            # that an unreadable input (directory, bad encoding, permissions) or a
+            # setup error is recorded for this item instead of aborting the whole
+            # batch before the report is written.
+            source_context = input_path.read_text(encoding="utf-8")
+            gen_input = GenerationInput(
+                source_context=source_context,
+                communicative_intent=item["caption"],
+                diagram_type=DiagramType.METHODOLOGY,
+            )
+            pipeline = PaperBananaPipeline(settings=settings)
+            result = asyncio.run(pipeline.generate(gen_input))
+            record = {
+                "id": item_id,
+                "input": item["input"],
+                "caption": item["caption"],
+                "run_id": result.metadata.get("run_id"),
+                "output_path": result.image_path,
+                "iterations": len(result.iterations),
+            }
+        except Exception as e:
+            # Per-item boundary: any failure is reported and the loop moves on.
+            console.print(f"  [red]✗[/red] {e}\n")
+            report["items"].append(_failure_record(item, str(e)))
+        else:
+            report["items"].append(record)
+            console.print(f"  [green]✓[/green] [dim]{result.image_path}[/dim]\n")
+
+    total_elapsed = time.perf_counter() - total_start
+    report["total_seconds"] = round(total_elapsed, 1)
+    report_path = batch_dir / "batch_report.json"
+    save_json(report, report_path)
+
+    # An item counts as succeeded when its record carries a non-empty output path.
+    succeeded = sum(1 for x in report["items"] if x.get("output_path"))
+    console.print(
+        f"[green]Batch complete.[/green] [dim]{total_elapsed:.1f}s · "
+        f"{succeeded}/{len(items)} succeeded[/dim]"
+    )
+    console.print(f"  Report: [bold]{report_path}[/bold]")
+
+
 @app.command()
 def plot(
     data: str = typer.Option(..., "--data", "-d", help="Path to data file (CSV or JSON)"),
diff --git a/paperbanana/core/batch.py b/paperbanana/core/batch.py
@@ -0,0 +1,81 @@
+"""Batch generation: manifest loading and batch run id."""
+
+from __future__ import annotations
+
+import datetime
+import uuid
+from pathlib import Path
+from typing import Any
+
+import structlog
+
+logger = structlog.get_logger()
+
+
+def generate_batch_id() -> str:
+    """Return a new batch run ID: ``batch_<YYYYmmdd_HHMMSS>_<6 hex chars>``.
+
+    The timestamp comes from ``datetime.datetime.now()`` and the suffix is the
+    first six hex digits of a random UUID4.
+    """
+    timestamp = f"{datetime.datetime.now():%Y%m%d_%H%M%S}"
+    suffix = uuid.uuid4().hex[:6]
+    return "_".join(("batch", timestamp, suffix))
+
+
+def load_batch_manifest(manifest_path: Path) -> list[dict[str, Any]]:
+    """Load a batch manifest (YAML or JSON) and return a list of normalized items.
+
+    The manifest is either a top-level list of items or an object with an
+    ``items`` list. Each returned item is a dict with:
+      - input: path to the methodology text file, as a string; relative paths are
+        resolved against the manifest's directory, absolute paths are kept
+      - caption: figure caption / communicative intent, coerced to ``str``
+      - id: item identifier as a string; ``item_<n>`` (1-based) when the manifest
+        omits it or leaves it empty
+
+    Input files are not checked for existence here.
+
+    Raises:
+        FileNotFoundError: the manifest file does not exist.
+        RuntimeError: a YAML manifest was given but PyYAML is not installed.
+        ValueError: unsupported extension, unparsable or empty content, wrong
+            top-level shape, or a malformed item.
+    """
+    manifest_path = Path(manifest_path).resolve()
+    if not manifest_path.exists():
+        raise FileNotFoundError(f"Manifest not found: {manifest_path}")
+    parent = manifest_path.parent
+    raw = manifest_path.read_text(encoding="utf-8")
+    suffix = manifest_path.suffix.lower()
+    if suffix in (".yaml", ".yml"):
+        try:
+            import yaml
+        except ImportError as exc:
+            raise RuntimeError(
+                "PyYAML is required for YAML manifests. Install with: pip install pyyaml"
+            ) from exc
+        try:
+            data = yaml.safe_load(raw)
+        except yaml.YAMLError as exc:
+            # Surface syntax errors as ValueError so callers that already handle
+            # malformed JSON (JSONDecodeError is a ValueError) handle YAML too.
+            raise ValueError(f"Invalid YAML in manifest: {exc}") from exc
+    elif suffix == ".json":
+        import json
+
+        data = json.loads(raw)
+    else:
+        raise ValueError(f"Manifest must be .yaml, .yml, or .json. Got: {manifest_path.suffix}")
+
+    if data is None:
+        raise ValueError("Manifest is empty")
+    if isinstance(data, list):
+        items = data
+    elif isinstance(data, dict) and "items" in data:
+        items = data["items"]
+    else:
+        raise ValueError("Manifest must be a list of items or an object with an 'items' list")
+    # Guards against e.g. `items: null` or a mapping/string under `items`, which
+    # would otherwise fail later with a TypeError or a misleading per-item error.
+    if not isinstance(items, list):
+        raise ValueError(f"Manifest 'items' must be a list, got {type(items).__name__}")
+
+    result = []
+    for i, entry in enumerate(items):
+        if not isinstance(entry, dict):
+            raise ValueError(f"Manifest item {i} must be an object, got {type(entry).__name__}")
+        inp = entry.get("input")
+        caption = entry.get("caption")
+        if not inp or not caption:
+            raise ValueError(f"Manifest item {i}: 'input' and 'caption' are required")
+        if not isinstance(inp, str):
+            raise ValueError(
+                f"Manifest item {i}: 'input' must be a string path, got {type(inp).__name__}"
+            )
+        input_path = Path(inp)
+        if not input_path.is_absolute():
+            input_path = (parent / input_path).resolve()
+        # An explicit null/empty id falls back to the positional default; any
+        # other value (e.g. a YAML integer) is normalized to a string.
+        raw_id = entry.get("id")
+        item_id = f"item_{i + 1}" if raw_id is None or raw_id == "" else str(raw_id)
+        result.append(
+            {
+                "input": str(input_path),
+                "caption": str(caption),
+                "id": item_id,
+            }
+        )
+    return result