diff --git a/src/lerobot/policies/pi05_full/annotate/annotate_libero.sh b/src/lerobot/policies/pi05_full/annotate/annotate_libero.sh index 0e5a3d8f0..cd2d61bec 100644 --- a/src/lerobot/policies/pi05_full/annotate/annotate_libero.sh +++ b/src/lerobot/policies/pi05_full/annotate/annotate_libero.sh @@ -4,25 +4,25 @@ # This generates user prompts and robot utterances for hierarchical policy training # Configuration -REPO_ID="lerobot/libero_video" +REPO_ID="lerobot/libero_10" MODEL="Qwen/Qwen3-VL-30B-A3B-Instruct" # or: MODEL="Qwen/Qwen2-VL-7B-Instruct" -OUTPUT_DIR="/fsx/jade_choghari/outputs/libero-annotate" +OUTPUT_DIR="/fsx/jade_choghari/outputs/libero-10-annotate-high" BATCH_SIZE=16 TEMPERATURE=0.9 SAMPLE_INTERVAL=5.0 # generate dialogue every 1 second (all episodes processed) # Run subtask annotation -python /admin/home/jade_choghari/lerobot/src/lerobot/policies/pi05_full/annotate/subtask_annotate.py \ - --repo-id "$REPO_ID" \ - --video-key observation.images.image \ - --output-dir "$OUTPUT_DIR" \ - --skip-existing \ - --output-repo-id "jadechoghari/libero-annotate" \ - --batch-size "$BATCH_SIZE" \ +# python /admin/home/jade_choghari/lerobot/src/lerobot/policies/pi05_full/annotate/subtask_annotate.py \ +# --repo-id "$REPO_ID" \ +# --video-key observation.images.image \ +# --output-dir "$OUTPUT_DIR" \ +# --skip-existing \ +# --output-repo-id "jadechoghari/libero10-annotate" \ +# --batch-size "$BATCH_SIZE" \ # run synthetic data generation (all episodes processed) # python examples/dataset/annotate_pgen.py \ # --repo-id "$REPO_ID" \ @@ -41,10 +41,10 @@ python /admin/home/jade_choghari/lerobot/src/lerobot/policies/pi05_full/annotate # add --push-to-hub flag # efficient batch processing: 4 episodes at once -# python /admin/home/jade_choghari/lerobot/src/lerobot/policies/pi05_full/annotate/high_level_annotate.py \ -# --repo-id "$REPO_ID" \ -# --output-dir "$OUTPUT_DIR" \ -# --video-mode \ -# --video-key observation.images.image \ -# --video-batch-size "$BATCH_SIZE" \ -# --sample-interval 5.0 +python /admin/home/jade_choghari/lerobot/src/lerobot/policies/pi05_full/annotate/high_level_annotate.py \ + --data-dir "/fsx/jade_choghari/outputs/libero-10-annotate" \ + --output-dir "$OUTPUT_DIR" \ + --video-mode \ + --video-key observation.images.image \ + --video-batch-size "$BATCH_SIZE" \ + --sample-interval 5.0 diff --git a/src/lerobot/policies/pi05_full/annotate/high_level_annotate.py b/src/lerobot/policies/pi05_full/annotate/high_level_annotate.py index d00931a4d..a37d4b6fa 100644 --- a/src/lerobot/policies/pi05_full/annotate/high_level_annotate.py +++ b/src/lerobot/policies/pi05_full/annotate/high_level_annotate.py @@ -769,7 +769,6 @@ def _parse_video_response(response: str, timestamps_with_skills: list[dict]) -> }) return results - breakpoint() # Fallback: return empty results for each timestamp print(f"Warning: Could not parse video response: {response[:200]}...") return [ diff --git a/src/lerobot/policies/pi05_full/annotate/load_lerobot_high.py b/src/lerobot/policies/pi05_full/annotate/load_lerobot_high.py index 0c6011c20..681fe72e8 100644 --- a/src/lerobot/policies/pi05_full/annotate/load_lerobot_high.py +++ b/src/lerobot/policies/pi05_full/annotate/load_lerobot_high.py @@ -4,7 +4,7 @@ from huggingface_hub import HfApi import lerobot from lerobot.datasets.lerobot_dataset import LeRobotDataset, LeRobotDatasetMetadata -dataset = LeRobotDataset(repo_id="local", root="/fsx/jade_choghari/outputs/pgen_annotations1") +dataset = LeRobotDataset(repo_id="local", root="/fsx/jade_choghari/.cache/huggingface/lerobot/lerobot/libero_10/") dataloader = torch.utils.data.DataLoader( dataset, @@ -23,9 +23,9 @@ print(batch['task'][0]) # read this parquet /fsx/jade_choghari/outputs/pgen_annotations1/meta/tasks.parquett -import pandas as pd -tasks_df = pd.read_parquet('/fsx/jade_choghari/outputs/pgen_annotations1/meta/tasks.parquet') +# import pandas as pd +# tasks_df = pd.read_parquet('/fsx/jade_choghari/outputs/pgen_annotations1/meta/tasks.parquet') -# print all -print(tasks_df.columns) -breakpoint() \ No newline at end of file +# # print all +# print(tasks_df.columns) +# breakpoint() \ No newline at end of file