From 9a9bc3b42c0abe37a76688c54525f361ebbb5cd4 Mon Sep 17 00:00:00 2001
From: Pepijn
Date: Thu, 9 Apr 2026 14:53:51 +0200
Subject: [PATCH] fix(ci): call extract_task_descriptions.py after eval in benchmark jobs
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The task descriptions were never populated in metrics.json because
extract_task_descriptions.py was never invoked. The script exists and
parse_eval_metrics.py already looks for its output — the call was simply
missing from the workflow.

Appends the extraction step to the existing bash -c block (runs inside the
container where libero/metaworld is installed) so task_descriptions.json
is written to the eval-artifacts dir before docker cp copies it out.

Co-Authored-By: Claude Opus 4.6 (1M context)
---
 .github/workflows/benchmark_tests.yml | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/.github/workflows/benchmark_tests.yml b/.github/workflows/benchmark_tests.yml
index afdc51814..9ba8c4b64 100644
--- a/.github/workflows/benchmark_tests.yml
+++ b/.github/workflows/benchmark_tests.yml
@@ -128,6 +128,9 @@ jobs:
                 '--env.camera_name_mapping={\"agentview_image\": \"camera1\", \"robot0_eye_in_hand_image\": \"camera2\"}' \
                 --policy.empty_cameras=1 \
                 --output_dir=/tmp/eval-artifacts
+              python scripts/ci/extract_task_descriptions.py \
+                --env libero --task libero_spatial \
+                --output /tmp/eval-artifacts/task_descriptions.json
             "
 
       - name: Copy Libero artifacts from container
@@ -268,6 +271,9 @@ jobs:
                 '--rename_map={\"observation.image\": \"observation.images.camera1\"}' \
                 --policy.empty_cameras=2 \
                 --output_dir=/tmp/eval-artifacts
+              python scripts/ci/extract_task_descriptions.py \
+                --env metaworld --task metaworld-push-v3 \
+                --output /tmp/eval-artifacts/task_descriptions.json
             "
 
       - name: Copy MetaWorld artifacts from container