mirror of
https://github.com/vale981/ray
synced 2025-03-06 02:21:39 -05:00
[RLlib] Update alpha_zero_policy.py (#15042)
This commit is contained in:
parent
40fdedd3de
commit
0552f6e886
1 changed file with 3 additions and 3 deletions
|
@@ -138,9 +138,9 @@ class AlphaZeroPolicy(TorchPolicy):
|
|||
grad_info = self.extra_grad_info(train_batch)
|
||||
grad_info.update(grad_process_info)
|
||||
grad_info.update({
|
||||
-"total_loss": loss_out.detach().numpy(),
|
||||
-"policy_loss": policy_loss.detach().numpy(),
|
||||
-"value_loss": value_loss.detach().numpy()
|
||||
+"total_loss": loss_out.detach().cpu().numpy(),
|
||||
+"policy_loss": policy_loss.detach().cpu().numpy(),
|
||||
+"value_loss": value_loss.detach().cpu().numpy()
|
||||
})
|
||||
|
||||
return {LEARNER_STATS_KEY: grad_info}
|
||||
|
|
Loading…
Add table
Reference in a new issue