Merge pull request #81 from Ruicky8/patch-1
Fix missing advantage computation when reward_EMA is disabled
This commit is contained in:
@@ -409,6 +409,8 @@ class ImagBehavior(nn.Module):
             metrics.update(tools.tensorstats(normed_target, "normed_target"))
             metrics["EMA_005"] = to_np(self.ema_vals[0])
             metrics["EMA_095"] = to_np(self.ema_vals[1])
+        else:
+            adv = target - base
 
         if self._config.imag_gradient == "dynamics":
             actor_target = adv
Reference in New Issue
Block a user