Xtra-Computing
diff --git a/configs/OpenRouter_llm_list.txt b/configs/OpenRouter_llm_list.txt
Lines changed: 10 additions & 0 deletions
diff --git a/pyproject.toml b/pyproject.toml
Lines changed: 1 addition & 1 deletion
diff --git a/scripts/calc_dna.py b/scripts/calc_dna.py
Lines changed: 51 additions & 4 deletions
@@ -0,0 +1,10 @@
+openrouter/pony-alpha
+anthropic/claude-opus-4.6
+anthropic/claude-sonnet-4.5
+z-ai/glm-4.7
+google/gemini-3-pro-preview
+google/gemini-3-flash-preview
+deepseek/deepseek-v3.2
+openai/gpt-5.2-codex
+openai/gpt-5.2
+x-ai/grok-4.1-fast
@@ -1,6 +1,6 @@
 [project]
 name = "reptrace"
-version = "0.1.1b1"
+version = "0.1.2b1"
 description = "Extract LLM DNA vectors — low-dimensional representations that capture functional behavior and model evolution."
 authors = [{ name = "RepTrace Project" }]
 license = { file = "LICENSE" }
 
@@ -6,6 +6,7 @@
     python scripts/calc_dna.py
     python scripts/calc_dna.py --model Qwen/Qwen2.5-0.5B-Instruct
     python scripts/calc_dna.py --model distilgpt2 --gpu 0 --samples 50
+    python scripts/calc_dna.py --llm-list ./configs/llm_list.txt --gpus 0,1
 """
 
 import argparse
@@ -18,7 +19,7 @@
 if str(SRC) not in sys.path:
     sys.path.insert(0, str(SRC))
 
-from reptrace import DNAExtractionConfig, calc_dna
+from reptrace import DNAExtractionConfig, calc_dna, calc_dna_parallel
 
 
 def main():
@@ -30,7 +31,13 @@ def main():
         "--model", 
         type=str, 
         default="distilgpt2",
-        help="Model name or Hugging Face model ID"
+        help="Model name or Hugging Face model ID (ignored if --llm-list is provided)"
+    )
+    parser.add_argument(
+        "--llm-list",
+        type=Path,
+        default=None,
+        help="Path to file containing model names (one per line) for batch processing"
     )
     parser.add_argument(
         "--dataset",
@@ -42,14 +49,25 @@ def main():
         "--gpu",
         type=int,
         default=None,
-        help="GPU ID to use (None for CPU)"
+        help="GPU ID to use for single model (None for CPU)"
+    )
+    parser.add_argument(
+        "--gpus",
+        type=str,
+        default=None,
+        help="Comma-separated GPU IDs for batch mode (e.g., '0,1,2')"
     )
     parser.add_argument(
         "--samples",
         type=int,
         default=100,
         help="Number of probe samples to use for DNA extraction"
     )
+    parser.add_argument(
+        "--continue-on-error",
+        action="store_true",
+        help="Continue processing remaining models if one fails (batch mode only)"
+    )
     parser.add_argument(
         "--no-save",
         action="store_true",
@@ -62,6 +80,11 @@ def main():
     data_root = str(ROOT / "data")
     output_dir = ROOT / "out"
 
+    # Parse GPU IDs for batch mode
+    gpu_ids = None
+    if args.gpus:
+        gpu_ids = [int(g.strip()) for g in args.gpus.split(",") if g.strip()]
+
     # Create configuration using the public API
     config = DNAExtractionConfig(
         model_name=args.model,
@@ -75,7 +98,30 @@ def main():
         trust_remote_code=True,
     )
 
-    # Extract DNA
+    # Batch mode: process multiple models from file
+    if args.llm_list:
+        print(f"Batch processing models from: {args.llm_list}")
+        print(f"Using {args.samples} probe samples per model")
+        if gpu_ids:
+            print(f"GPUs: {gpu_ids}")
+        
+        results = calc_dna_parallel(
+            config=config,
+            llm_list=args.llm_list,
+            gpu_ids=gpu_ids,
+            continue_on_error=args.continue_on_error,
+        )
+        
+        # Display batch results
+        print(f"\n{'='*60}")
+        print(f"Processed {len(results)} model(s):")
+        for result in results:
+            print(f"  - {result.model_name}: shape={result.vector.shape}, time={result.elapsed_seconds:.2f}s")
+            if result.output_path:
+                print(f"    Saved to: {result.output_path}")
+        return 0
+
+    # Single model mode
     print(f"Extracting DNA from: {args.model}")
     print(f"Using {args.samples} probe samples")
     result = calc_dna(config)
@@ -94,3 +140,4 @@ def main():
 
 if __name__ == "__main__":
     sys.exit(main())
+