fix(policies): support Diffusion Policy (dp) training when n_obs_steps=1 (#2430)

Co-authored-by: hukongtao <hukongtao@agibot.com> Co-authored-by: Steven Palma <imstevenpmwork@ieee.org>
2026-07-08 18:41:54 +00:00 · 2026-02-26 00:36:31 +08:00
parent 9a5ab8ffab
commit d0b58190da
1 changed file with 3 additions and 0 deletions
@@ -142,6 +142,9 @@ class DiffusionPolicy(PreTrainedPolicy):
        """Run the batch through the model and compute the loss for training or validation."""
        if self.config.image_features:
            batch = dict(batch)  # shallow copy so that adding a key doesn't modify the original
+            for key in self.config.image_features:
+                if self.config.n_obs_steps == 1 and batch[key].ndim == 4:
+                    batch[key] = batch[key].unsqueeze(1)
            batch[OBS_IMAGES] = torch.stack([batch[key] for key in self.config.image_features], dim=-4)
        loss = self.diffusion.compute_loss(batch)
        # no output_dict so returning None