Merge branch 'feat/smolvla-on-steerable' of https://github.com/huggingface/lerobot into feat/smolvla-on-steerable

2026-07-24 10:16:09 +00:00 · 2026-05-25 16:56:50 +02:00
parent 1e9a6d044d 3fdfcb912a
commit da3e87ee86
2 changed files with 109 additions and 10 deletions
@@ -14,13 +14,15 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
-"""Rebuild the 16 RoboCasa composite_seen tarballs into one unified LeRobot v3 dataset.
+"""Rebuild RoboCasa tarballs into one unified LeRobot v3 dataset.
-Filter-only wrapper around the canonical RoboCasa port script — restricts the
+Discovers tasks from RoboCasa's ``box_links_ds.json`` for a given ``--split``
-discovered task set to the 16 ``composite_seen`` tasks (the multi-step subset
+(``target`` or ``pretrain``) and ``--source`` (``human`` / ``mimicgen``), then
-of the official RoboCasa365 target benchmark) so a single command produces the
+filters to a chosen ``--task-set`` (``composite_seen``, ``composite_unseen``,
-exact dataset slice needed for an apples-to-apples pi05 vs pi052 comparison
+``composite_all``, ``atomic``, ``composite_atomic``, ``all``) or an explicit
-on multi-step kitchen manipulation.
+``--tasks`` list. Same code path produces the 16-task ``composite_seen`` slice,
 the full 50-task target benchmark, the 300-task ``Human300`` pretraining
 slice, or any 2-task smoke set.
 Per-rank, each datatrove worker:
@@ -83,8 +85,7 @@ DEFAULT_SPLIT = "target"
 DEFAULT_SOURCE = "human"
 DEFAULT_ROBOT_TYPE = "robocasa"
-# The 16 composite_seen tasks (RoboCasa365 target benchmark, multi-step subset).
+# RoboCasa365 target benchmark task groupings.
 # Order matches the official RoboCasa documentation.
 COMPOSITE_SEEN_TASKS: list[str] = [
    "DeliverStraw",
    "GetToastedBread",
@@ -104,9 +105,52 @@ COMPOSITE_SEEN_TASKS: list[str] = [
    "WashLettuce",
 ]
-# Other groupings, exposed via ``--task-set`` for symmetry — populated lazily.
+COMPOSITE_UNSEEN_TASKS: list[str] = [  # 16 task names; the "composite_unseen" entry of TASK_SETS
    "ArrangeBreadBasket",
    "ArrangeTea",
    "BreadSelection",
    "CategorizeCondiments",
    "CuttingToolSelection",
    "GarnishPancake",
    "GatherTableware",
    "HeatKebabSandwich",
    "MakeIceLemonade",
    "PanTransfer",
    "PortionHotDogs",
    "RecycleBottlesByType",
    "SeparateFreezerRack",
    "WaffleReheat",
    "WashFruitColander",
    "WeighIngredients",
 ]
 # 18 task names; exposed as the "atomic" entry of TASK_SETS and appended to
 # the composite lists for the "composite_atomic" entry.
 ATOMIC_TASKS: list[str] = [
    "CloseBlenderLid",
    "CloseFridge",
    "CloseToasterOvenDoor",
    "CoffeeSetupMug",
    "NavigateKitchen",
    "OpenCabinet",
    "OpenDrawer",
    "OpenStandMixerHead",
    "PickPlaceCounterToCabinet",
    "PickPlaceCounterToStove",
    "PickPlaceDrawerToCounter",
    "PickPlaceSinkToCounter",
    "PickPlaceToasterToCounter",
    "SlideDishwasherRack",
    "TurnOffStove",
    "TurnOnElectricKettle",
    "TurnOnMicrowave",
    "TurnOnSinkFaucet",
 ]
 # Named task groupings, keyed by the values accepted for ``--task-set``.
 # Combined groupings keep the order seen -> unseen -> atomic.
 TASK_SETS: dict[str, list[str]] = {
    "composite_seen": COMPOSITE_SEEN_TASKS,
    "composite_unseen": COMPOSITE_UNSEEN_TASKS,
    "composite_all": [*COMPOSITE_SEEN_TASKS, *COMPOSITE_UNSEEN_TASKS],
    "atomic": ATOMIC_TASKS,
    "composite_atomic": [
        *COMPOSITE_SEEN_TASKS,
        *COMPOSITE_UNSEEN_TASKS,
        *ATOMIC_TASKS,
    ],
    # Empty list is a sentinel meaning "apply no task filter".
    "all": [],
 }
@@ -658,6 +702,7 @@ class AggregateRoboCasaUnifiedShards(PipelineStep):
        output_root: str,
        push: bool = True,
        overwrite: bool = False,
        hub_tags: list[str] | None = None,
    ):
        super().__init__()
        self.output_repo_id = output_repo_id
@@ -665,6 +710,7 @@ class AggregateRoboCasaUnifiedShards(PipelineStep):
        self.output_root = Path(output_root)
        self.push = push
        self.overwrite = overwrite
        self.hub_tags = hub_tags or ["lerobot", "robocasa", "unified"]
    def run(self, data=None, rank: int = 0, world_size: int = 1):
        import json
@@ -724,7 +770,7 @@ class AggregateRoboCasaUnifiedShards(PipelineStep):
        if self.push:
            dataset = LeRobotDataset(repo_id=self.output_repo_id, root=self.output_root)
            dataset.push_to_hub(
-                tags=["lerobot", "robocasa", "composite_seen", "unified"],
+                tags=self.hub_tags,
                private=False,
            )
            logging.info("Pushed to https://huggingface.co/datasets/%s", self.output_repo_id)
@@ -799,6 +845,7 @@ def make_aggregate_executor(
    mem_per_cpu: str,
    time_limit: str,
    slurm: bool,
    hub_tags: list[str] | None = None,
    depends: SlurmPipelineExecutor | None = None,
 ):
    kwargs = {
@@ -809,6 +856,7 @@ def make_aggregate_executor(
                output_root=str(output_root),
                push=push,
                overwrite=overwrite,
                hub_tags=hub_tags,
            )
        ],
        "logging_dir": str(logs_dir / job_name),
@@ -969,6 +1017,9 @@ def main():
            prepare_executor.run()
    if args.mode in {"all", "aggregate"}:
        hub_tags = ["lerobot", "robocasa", "unified", args.split, args.source]
        if not args.tasks and args.task_set != "all":
            hub_tags.append(args.task_set)
        aggregate_executor = make_aggregate_executor(
            output_repo_id=output_repo_id,
            shard_roots=shard_roots,
@@ -982,6 +1033,7 @@ def main():
            mem_per_cpu=args.mem_per_cpu,
            time_limit=args.time,
            slurm=args.slurm == 1,
            hub_tags=hub_tags,
            depends=prepare_executor if args.mode == "all" and args.slurm == 1 else None,
        )
        if args.mode == "all" and args.slurm == 1:
@@ -0,0 +1,47 @@
 #!/bin/bash
 # Build a tiny RoboCasa smoke dataset (2 short atomic tasks, all episodes) for
 # fast end-to-end training validation before the real run.
 #
 # Defaults: target/human, OpenStandMixerHead + NavigateKitchen (~1k episodes,
 # ~131k frames, ~109 min @ 20 fps), 2 SLURM workers on hopper-cpu.
 #
 # Override via env:
 #   TASKS          whitespace-separated task names forwarded to --tasks
 #   REPO_ID        destination repo id; when unset, HF_USER must be set and
 #                  the default is $HF_USER/robocasa_smoke_2atomic_v3
 #   WORK_DIR       default /fsx/$USER/robocasa/datasets/v1.0
 #   ROBOCASA_ROOT  default /fsx/$USER/robocasa
 #   LOGS_DIR       default /fsx/$USER/logs/robocasa
 #   LEROBOT_ROOT   directory to cd into before running (default $HOME/lerobot)
 #   WORKERS, CPUS, PARTITION   forwarded to --workers/--cpus-per-task/--partition
 #   LOCAL=1        appends --slurm=0 to the Python invocation
 set -euo pipefail
 cd "${LEROBOT_ROOT:-$HOME/lerobot}"
 source ~/miniconda3/etc/profile.d/conda.sh
 conda activate lerobot
 REPO_ID="${REPO_ID:-${HF_USER:?HF_USER is unset}/robocasa_smoke_2atomic_v3}"
 WORK_DIR="${WORK_DIR:-/fsx/${USER}/robocasa/datasets/v1.0}"
 ROBOCASA_ROOT="${ROBOCASA_ROOT:-/fsx/${USER}/robocasa}"
 LOGS_DIR="${LOGS_DIR:-/fsx/${USER}/logs/robocasa}"
 TASKS="${TASKS:-OpenStandMixerHead NavigateKitchen}"
 WORKERS="${WORKERS:-2}"
 CPUS="${CPUS:-8}"
 PARTITION="${PARTITION:-hopper-cpu}"
 LOCAL="${LOCAL:-0}"
 # Split TASKS on whitespace into an array with pathname expansion disabled,
 # so a stray wildcard character in TASKS can never expand against files in
 # the working directory.
 set -f
 # shellcheck disable=SC2206  # word splitting is intentional here
 TASK_LIST=($TASKS)
 set +f
 # A whitespace-only TASKS would otherwise pass a bare --tasks flag.
 if [[ ${#TASK_LIST[@]} -eq 0 ]]; then
    echo "TASKS must name at least one task" >&2
    exit 1
 fi
 ARGS=(
    examples/port_datasets/slurm_build_robocasa_composite_seen.py
    --repo-id="$REPO_ID"
    --work-dir="$WORK_DIR"
    --robocasa-root="$ROBOCASA_ROOT"
    --split=target --source=human
    --tasks "${TASK_LIST[@]}"
    --workers="$WORKERS"
    --cpus-per-task="$CPUS"
    --partition="$PARTITION"
    --mem-per-cpu=4G
    --time=04:00:00
    --logs-dir="$LOGS_DIR"
    --job-name=port_robocasa_smoke
 )
 if [[ "$LOCAL" == "1" ]]; then
    ARGS+=(--slurm=0)
 fi
 echo "Smoke dataset: $REPO_ID"
 echo "Tasks: $TASKS"
 python "${ARGS[@]}"