Remove the DINO vision encoder and simplify the text and vision encoders by removing their inheritance structure

This commit is contained in:
Bryson Jones
2025-12-10 11:09:37 -08:00
parent 55e19ff9a7
commit adabb37af6
4 changed files with 42 additions and 186 deletions
+1 -1
View File
@@ -122,7 +122,7 @@ phone = ["hebi-py>=2.8.0,<2.12.0", "teleop>=0.1.0,<0.2.0", "fastapi<1.0"]
# Policies
pi = ["transformers @ git+https://github.com/huggingface/transformers.git@fix/lerobot_openpi"]
smolvla = ["lerobot[transformers-dep]", "num2words>=0.5.14,<0.6.0", "accelerate>=1.7.0,<2.0.0", "safetensors>=0.4.3,<1.0.0"]
multi_task_dit = ["lerobot[transformers-dep]", "timm>=1.0.20"]
multi_task_dit = ["lerobot[transformers-dep]"]
groot = [
"lerobot[transformers-dep]",
"peft>=0.13.0,<1.0.0",