diff --git a/tianshou/__init__.py b/tianshou/__init__.py index f0cc7c75d..71f5e0a70 100644 --- a/tianshou/__init__.py +++ b/tianshou/__init__.py @@ -1,6 +1,6 @@ from tianshou import data, env, exploration, policy, trainer, utils -__version__ = "0.4.10" +__version__ = "0.4.11" __all__ = [ "env", diff --git a/tianshou/policy/modelfree/pg.py b/tianshou/policy/modelfree/pg.py index 1557c1ad6..4f0b1b182 100644 --- a/tianshou/policy/modelfree/pg.py +++ b/tianshou/policy/modelfree/pg.py @@ -105,7 +105,7 @@ def forward( Please refer to :meth:`~tianshou.policy.BasePolicy.forward` for more detailed explanation. """ - logits, hidden = self.actor(batch.obs, state=state) + logits, hidden = self.actor(batch.obs, state=state, info=batch.info) if isinstance(logits, tuple): dist = self.dist_fn(*logits) else: