From aaf8576411492db07ec04f9987d2207a69a46c2c Mon Sep 17 00:00:00 2001 From: Khalil Meftah Date: Thu, 19 Mar 2026 12:36:02 +0100 Subject: [PATCH] chore: rename losses --- src/lerobot/rl/algorithms/sac/sac_algorithm.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/src/lerobot/rl/algorithms/sac/sac_algorithm.py b/src/lerobot/rl/algorithms/sac/sac_algorithm.py index 55b228026..6d24db39c 100644 --- a/src/lerobot/rl/algorithms/sac/sac_algorithm.py +++ b/src/lerobot/rl/algorithms/sac/sac_algorithm.py @@ -189,7 +189,7 @@ class SACAlgorithm(RLAlgorithm): critic_loss_val = loss_critic.item() stats = TrainingStats( - losses={"critic": critic_loss_val}, + losses={"loss_critic": critic_loss_val}, grad_norms={"critic": critic_grad_norm}, ) @@ -202,7 +202,7 @@ class SACAlgorithm(RLAlgorithm): max_norm=self.config.clip_grad_norm, ).item() self.optimizers["discrete_critic"].step() - stats.losses["discrete_critic"] = loss_discrete.item() + stats.losses["loss_discrete_critic"] = loss_discrete.item() stats.grad_norms["discrete_critic"] = dc_grad if self._optimization_step % self.config.policy_update_freq == 0: @@ -225,8 +225,8 @@ class SACAlgorithm(RLAlgorithm): ).item() self.optimizers["temperature"].step() - stats.losses["actor"] = actor_loss.item() - stats.losses["temperature"] = temp_loss.item() + stats.losses["loss_actor"] = actor_loss.item() + stats.losses["loss_temperature"] = temp_loss.item() stats.grad_norms["actor"] = actor_grad stats.grad_norms["temperature"] = temp_grad stats.extra["temperature"] = self.temperature