We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent fc75c52, commit c70e4b5 (Copy full SHA for c70e4b5)
rsl_rl/algorithms/ppo.py
@@ -361,6 +361,7 @@ def update(self): # noqa: C901
361
num_updates = self.num_learning_epochs * self.num_mini_batches
362
mean_value_loss /= num_updates
363
mean_surrogate_loss /= num_updates
364
+ mean_entropy /= num_updates
365
# -- For RND
366
if mean_rnd_loss is not None:
367
mean_rnd_loss /= num_updates
0 commit comments