Normalize returns

This commit is contained in:
Antonin RAFFIN 2019-11-12 22:32:21 +01:00
parent 623e3cf4f9
commit d725d01186

View file

@@ -206,6 +206,7 @@ class TD3(BaseRLModel):
# Normalize returns
# returns = (returns - returns.mean()) / (returns.std() + 1e-8)
returns = (returns - returns.mean())
policy_loss = -(returns * log_prob).mean()