Use observation filter in compute_action for PPO. (#884)

This commit is contained in:
Robert Nishihara 2017-08-28 23:01:29 -07:00 committed by Philipp Moritz
parent 5d72818ddc
commit 60d4d01d06

View file

@ -266,4 +266,5 @@ class PolicyGradient(Algorithm):
for (a, o) in zip(self.agents, extra_data[4])])
def compute_action(self, observation):
    """Return the common policy's output for a single observation.

    The observation is first passed through ``self.model.observation_filter``;
    the filtered value is then handed to ``self.model.common_policy.compute``
    inside a one-element list.

    Args:
        observation: A single raw observation.

    Returns:
        Element ``[0][0]`` of the value returned by ``common_policy.compute``.
    """
    # NOTE(review): if the filter keeps running statistics, calling it here
    # may also update them -- confirm against the filter implementation.
    apply_filter = self.model.observation_filter
    filtered = apply_filter(observation)

    # The policy is queried with a one-element list; presumably compute()
    # expects a batch of observations -- TODO confirm.
    policy = self.model.common_policy
    outputs = policy.compute([filtered])
    return outputs[0][0]