DROID training

kvablack · kvablack · commit cdf8436b6f55 · 2025-08-26T17:46:26.000Z
diff --git a/examples/droid/README_train.md b/examples/droid/README_train.md
@@ -15,15 +15,11 @@ uv sync --group rlds
 
 ## Download DROID dataset
 
-You can download a (slightly outdated) version of DROID with the following command (after installing the `gsutil` google cloud CLI):
+You can download the DROID dataset with the following command (after installing the `gsutil` Google Cloud CLI):
 ```
-gsutil -m cp -r gs://gresearch/robotics/droid <your_download_path>
+gsutil -m cp -r gs://gresearch/robotics/droid/1.0.1 <your_download_path>/droid/1.0.1
 ```
 
-Note that this version of DROID is slightly outdated: it only contains a partial set of language annotations (~30k episodes).
-Please email [karl.pertsch@gmail.com](mailto:karl.pertsch@gmail.com) to get access to the most up-to-date version of the DROID RLDS dataset (with language annotations on 75k episodes)!
-(sorry, we are working on updating the version on the official bucket).
-
 You will need 1.8TB of disk storage to download the DROID RLDS dataset.
 
 ## Run
diff --git a/src/openpi/shared/download.py b/src/openpi/shared/download.py
@@ -1,6 +1,5 @@
 import concurrent.futures
 import datetime
-import getpass
 import logging
 import os
 import pathlib
@@ -17,16 +16,13 @@
 
 # Environment variable to control cache directory path, ~/.cache/openpi will be used by default.
 _OPENPI_DATA_HOME = "OPENPI_DATA_HOME"
+DEFAULT_CACHE_DIR = "~/.cache/openpi"
 
 logger = logging.getLogger(__name__)
 
 
 def get_cache_dir() -> pathlib.Path:
-    default_dir = "~/.cache/openpi"
-    if os.path.exists("/mnt/weka"):  # noqa: PTH110
-        default_dir = f"/mnt/weka/{getpass.getuser()}/.cache/openpi"
-
-    cache_dir = pathlib.Path(os.getenv(_OPENPI_DATA_HOME, default_dir)).expanduser().resolve()
+    cache_dir = pathlib.Path(os.getenv(_OPENPI_DATA_HOME, DEFAULT_CACHE_DIR)).expanduser().resolve()
     cache_dir.mkdir(parents=True, exist_ok=True)
     _set_folder_permission(cache_dir)
     return cache_dir
diff --git a/src/openpi/training/config.py b/src/openpi/training/config.py
@@ -379,7 +379,7 @@ def create(self, assets_dirs: pathlib.Path, model_config: _model.BaseModelConfig
         )
 
         data_transforms = _transforms.Group(
-            inputs=[droid_policy.DroidInputs(action_dim=model_config.action_dim, model_type=model_config.model_type)],
+            inputs=[droid_policy.DroidInputs(model_type=model_config.model_type)],
             outputs=[droid_policy.DroidOutputs()],
         )
 
@@ -837,6 +837,42 @@ def __post_init__(self) -> None:
         keep_period=20_000,
         num_workers=0,  # Important: RLDS DataLoader requires num_workers=0, handles multi-processing internally
     ),
+    TrainConfig(
+        # This config is for fine-tuning pi05 on the *full* DROID dataset.
+        # We use RLDS data loading to make training on this large dataset tractable.
+        # For fine-tuning on your own DROID dataset, see below.
+        name="pi05_full_droid_finetune",
+        model=pi0.Pi0Config(
+            pi05=True,
+            action_dim=32,
+            action_horizon=16,
+        ),
+        data=RLDSDroidDataConfig(
+            repo_id="droid",
+            # Set this to the path to your DROID RLDS dataset (the parent directory of the `droid` directory).
+            rlds_data_dir="/mnt/pi-data/kevin",
+            action_space=droid_rlds_dataset.DroidActionSpace.JOINT_POSITION,
+            assets=AssetsConfig(
+                assets_dir="gs://openpi-assets-preview/checkpoints/pi05_may21_280k_v1/assets/",
+                asset_id="droid",
+            ),
+        ),
+        weight_loader=weight_loaders.CheckpointWeightLoader(
+            "gs://openpi-assets-preview/checkpoints/pi05_may21_280k_v1/params"
+        ),
+        lr_schedule=_optimizer.CosineDecaySchedule(
+            warmup_steps=1_000,
+            peak_lr=5e-5,
+            decay_steps=1_000_000,
+            decay_lr=5e-5,
+        ),
+        num_train_steps=100_000,
+        batch_size=256,
+        log_interval=100,
+        save_interval=5000,
+        keep_period=10_000,
+        num_workers=0,  # Important: RLDS DataLoader requires num_workers=0, handles multi-processing internally
+    ),
     TrainConfig(
         # This config is for fine-tuning pi05-DROID on a custom (smaller) DROID dataset.
         # Here, we use LeRobot data format (like for all other fine-tuning examples)