mirror of
https://github.com/saymrwulf/stable-baselines3.git
synced 2026-05-28 22:56:53 +00:00
Fix ortho init when bias=False with custom policy (#126)
* Update policies.py: fix the AttributeError raised when a linear layer created with "bias=False" is used in a custom FeaturesExtractor (#124) * Update changelog.rst: update the changelog accordingly * Update changelog.rst Co-authored-by: Kong Lingchao <konglingchao@gmail.com> Co-authored-by: Antonin RAFFIN <antonin.raffin@ensta.org>
This commit is contained in:
parent
83530560b5
commit
bd2aae0c27
2 changed files with 4 additions and 2 deletions
|
|
@ -31,6 +31,7 @@ Bug Fixes:
|
|||
- Fixed a bug in the ``close()`` method of ``SubprocVecEnv``, causing wrappers further down in the wrapper stack to not be closed. (@NeoExtended)
|
||||
- Fix target for updating q values in SAC: the entropy term was not conditioned by terminal states
|
||||
- Use ``cloudpickle.load`` instead of ``pickle.load`` in ``CloudpickleWrapper``. (@shwang)
|
||||
- Fixed a bug with orthogonal initialization when ``bias=False`` in custom policy (@rk37)
|
||||
|
||||
Deprecations:
|
||||
^^^^^^^^^^^^^
|
||||
|
|
@ -356,4 +357,4 @@ And all the contributors:
|
|||
@Miffyli @dwiel @miguelrass @qxcv @jaberkow @eavelardev @ruifeng96150 @pedrohbtp @srivatsankrishnan @evilsocket
|
||||
@MarvineGothic @jdossgollin @SyllogismRXS @rusu24edward @jbulow @Antymon @seheevic @justinkterry @edbeeching
|
||||
@flodorner @KuKuXia @NeoExtended @PartiallyTyped @mmcenta @richardwu @kinalmehta @rolandgvc @tkelestemur @mloo3
|
||||
@tirafesi @blurLake @koulakis @joeljosephjin @shwang
|
||||
@tirafesi @blurLake @koulakis @joeljosephjin @shwang @rk37
|
||||
|
|
|
|||
|
|
@ -188,7 +188,8 @@ class BasePolicy(BaseModel):
|
|||
"""
|
||||
if isinstance(module, (nn.Linear, nn.Conv2d)):
|
||||
nn.init.orthogonal_(module.weight, gain=gain)
|
||||
module.bias.data.fill_(0.0)
|
||||
if module.bias is not None:
|
||||
module.bias.data.fill_(0.0)
|
||||
|
||||
@abstractmethod
|
||||
def _predict(self, observation: th.Tensor, deterministic: bool = False) -> th.Tensor:
|
||||
|
|
|
|||
Loading…
Reference in a new issue