refactor(policies): Remove unnormalization step from action predictions

- Eliminated the unnormalization of actions in both `TDMPCPolicy` and `VQBeTPolicy` classes to streamline action prediction.
- This change improves code clarity and aligns with recent updates to policy processors.
2026-07-09 11:01:53 +00:00 · 2025-07-07 17:56:34 +02:00
parent 7eccefe235
commit 7bd0d62ce5
2 changed files with 0 additions and 2 deletions
@@ -129,7 +129,6 @@ class TDMPCPolicy(PreTrainedPolicy):

        actions = torch.clamp(actions, -1, +1)

-        actions = self.unnormalize_outputs({ACTION: actions})[ACTION]
        return actions

    @torch.no_grad()
@@ -118,7 +118,6 @@ class VQBeTPolicy(PreTrainedPolicy):
    def predict_action_chunk(self, batch: dict[str, Tensor]) -> Tensor:
        batch = {k: torch.stack(list(self._queues[k]), dim=1) for k in batch if k in self._queues}
        actions = self.vqbet(batch, rollout=True)[:, : self.config.action_chunk_size]
-        actions = self.unnormalize_outputs({ACTION: actions})[ACTION]
        return actions

    @torch.no_grad()