introduced return used in author's code
This commit is contained in:
@@ -400,9 +400,9 @@ class ImagBehavior(nn.Module):
|
|||||||
reward += self._config.actor_state_entropy() * state_ent
|
reward += self._config.actor_state_entropy() * state_ent
|
||||||
value = self.value(imag_feat).mode()
|
value = self.value(imag_feat).mode()
|
||||||
target = tools.lambda_return(
|
target = tools.lambda_return(
|
||||||
reward[:-1],
|
reward[1:],
|
||||||
value[:-1],
|
value[:-1],
|
||||||
discount[:-1],
|
discount[1:],
|
||||||
bootstrap=value[-1],
|
bootstrap=value[-1],
|
||||||
lambda_=self._config.discount_lambda,
|
lambda_=self._config.discount_lambda,
|
||||||
axis=0,
|
axis=0,
|
||||||
|
|||||||
Reference in New Issue
Block a user