Merge pull request #81 from Ruicky8/patch-1

Fix missing advantage computation when reward_EMA is disabled
This commit is contained in:
Naoki Morihira
2026-03-08 13:31:20 +09:00
committed by GitHub

View File

@@ -409,6 +409,8 @@ class ImagBehavior(nn.Module):
metrics.update(tools.tensorstats(normed_target, "normed_target"))
metrics["EMA_005"] = to_np(self.ema_vals[0])
metrics["EMA_095"] = to_np(self.ema_vals[1])
else:
adv = target - base
if self._config.imag_gradient == "dynamics":
actor_target = adv