PPO torch policy: let the non-GAE `value` stub accept any call signature.

In the `else` branch (per the in-code comment, the case where GAE is not used
and the value function's output is not required), the placeholder `value`
function always returns 0.0. This patch replaces its fixed parameter list
`(ob, prev_action, prev_reward, *state)` with `(*args, **kwargs)`, so the stub
no longer constrains how it is called; the returned value is unchanged.

NOTE(review): line breaks, blank context lines and indentation inside the hunk
were reconstructed from a whitespace-collapsed copy of this patch. The hunk
header counts (7 lines on each side) are consistent with the layout below, but
confirm the exact whitespace against the target file before applying.

diff --git a/rllib/agents/ppo/ppo_torch_policy.py b/rllib/agents/ppo/ppo_torch_policy.py
index a268e7487..fa2ca6c1d 100644
--- a/rllib/agents/ppo/ppo_torch_policy.py
+++ b/rllib/agents/ppo/ppo_torch_policy.py
@@ -244,7 +244,7 @@ class ValueNetworkMixin:
         # When not doing GAE, we do not require the value function's output.
         else:
 
-            def value(ob, prev_action, prev_reward, *state):
+            def value(*args, **kwargs):
                 return 0.0
 
         self._value = value