diff --git a/torchy_baselines/a2c/a2c.py b/torchy_baselines/a2c/a2c.py index 8807c91..9e6af14 100644 --- a/torchy_baselines/a2c/a2c.py +++ b/torchy_baselines/a2c/a2c.py @@ -125,7 +125,7 @@ class A2C(PPO): logger.logkv("value_loss", value_loss.item()) logger.logkv("std", th.exp(self.policy.log_std).mean().item()) - def learn(self, total_timesteps, callback=None, log_interval=5, + def learn(self, total_timesteps, callback=None, log_interval=100, eval_env=None, eval_freq=-1, n_eval_episodes=5, tb_log_name="A2C", reset_num_timesteps=True): return super(A2C, self).learn(total_timesteps=total_timesteps, callback=callback, log_interval=log_interval,