diff --git a/.github/workflows/benchmark_tests.yml b/.github/workflows/benchmark_tests.yml index 37d6e3fd2..523a31175 100644 --- a/.github/workflows/benchmark_tests.yml +++ b/.github/workflows/benchmark_tests.yml @@ -354,7 +354,7 @@ jobs: cache-from: type=local,src=/tmp/.buildx-cache-robotwin cache-to: type=local,dest=/tmp/.buildx-cache-robotwin,mode=max - - name: Run RoboTwin 2.0 smoke eval (1 episode) + - name: Run RoboTwin 2.0 smoke eval (10 tasks, 1 episode each) if: env.HF_USER_TOKEN != '' run: | # Named container (no --rm) so we can docker cp artifacts out. @@ -368,7 +368,7 @@ jobs: cd /opt/robotwin && lerobot-eval \ --policy.path=lerobot/smolvla_robotwin \ --env.type=robotwin \ - --env.task=beat_block_hammer,click_bell,handover_block,open_laptop,stack_blocks_two \ + --env.task=beat_block_hammer,click_bell,handover_block,open_laptop,stack_blocks_two,click_alarmclock,close_laptop,close_microwave,open_microwave,place_block \ --eval.batch_size=1 \ --eval.n_episodes=1 \ --eval.use_async_envs=false \ @@ -377,7 +377,7 @@ jobs: --output_dir=/tmp/eval-artifacts python /lerobot/scripts/ci/extract_task_descriptions.py \ --env robotwin \ - --task beat_block_hammer,click_bell,handover_block,open_laptop,stack_blocks_two \ + --task beat_block_hammer,click_bell,handover_block,open_laptop,stack_blocks_two,click_alarmclock,close_laptop,close_microwave,open_microwave,place_block \ --output /tmp/eval-artifacts/task_descriptions.json " @@ -394,7 +394,7 @@ jobs: python3 scripts/ci/parse_eval_metrics.py \ --artifacts-dir /tmp/robotwin-artifacts \ --env robotwin \ - --task beat_block_hammer,click_bell,handover_block,open_laptop,stack_blocks_two \ + --task beat_block_hammer,click_bell,handover_block,open_laptop,stack_blocks_two,click_alarmclock,close_laptop,close_microwave,open_microwave,place_block \ --policy lerobot/smolvla_robotwin - name: Upload RoboTwin rollout video