Checkpoint Adam momenta for DDPG (#7449)

This commit is contained in:
Eric Liang 2020-03-04 10:03:41 -08:00 committed by GitHub
parent fe7820fec9
commit aa4861c2a0
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@@ -295,7 +295,8 @@ class DDPGTFPolicy(DDPGPostprocessing, TFPolicy):
# Note that this encompasses both the policy and Q-value networks and
# their corresponding target networks
self.variables = ray.experimental.tf_utils.TensorFlowVariables(
- tf.group(q_t_det_policy, q_tp1), self.sess)
+ tf.group(q_t_det_policy, q_tp1, self._actor_optimizer.variables(),
+ self._critic_optimizer.variables()), self.sess)
# Hard initial update
self.update_target(tau=1.0)