Introduced the lambda-return computation used in the author's code (reward[1:] and discount[1:] instead of reward[:-1] and discount[:-1])
This commit is contained in:
parent
784a69f80c
commit
9c58ab62c0
@ -400,9 +400,9 @@ class ImagBehavior(nn.Module):
|
|||||||
reward += self._config.actor_state_entropy() * state_ent
|
reward += self._config.actor_state_entropy() * state_ent
|
||||||
value = self.value(imag_feat).mode()
|
value = self.value(imag_feat).mode()
|
||||||
target = tools.lambda_return(
|
target = tools.lambda_return(
|
||||||
reward[:-1],
|
reward[1:],
|
||||||
value[:-1],
|
value[:-1],
|
||||||
discount[:-1],
|
discount[1:],
|
||||||
bootstrap=value[-1],
|
bootstrap=value[-1],
|
||||||
lambda_=self._config.discount_lambda,
|
lambda_=self._config.discount_lambda,
|
||||||
axis=0,
|
axis=0,
|
||||||
|
Loading…
x
Reference in New Issue
Block a user