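From cb56f390700be2b5cb16069cc425a5adc07a4358 Mon Sep 17 00:00:00 2001 From: Eric Liang Date: Sat, 29 Sep 2018 22:57:47 -0700 Subject: [PATCH] [rllib] Entropy calculation for diag gaussian missing 0.5 term (#2968) See: https://en.wikipedia.org/wiki/Multivariate_normal_distribution#Entropy --- NOTE(review): the cited formula is H = 0.5 * ln det(2*pi*e*Sigma). For a diagonal covariance Sigma = diag(std^2) this expands to sum_i [ln(std_i) + 0.5 * ln(2*pi*e)], because 0.5 * ln(std_i^2) = ln(std_i). So if self.log_std holds the log of the standard deviation (as the name suggests; confirm against the constructor), the removed line was already correct and the added 0.5 factor halves the log_std contribution; the 0.5 factor is only right if the tensor holds the log-variance. python/ray/rllib/models/action_dist.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/ray/rllib/models/action_dist.py b/python/ray/rllib/models/action_dist.py index fb3c61a11..b0cfe4141 100644 --- a/python/ray/rllib/models/action_dist.py +++ b/python/ray/rllib/models/action_dist.py @@ -125,7 +125,7 @@ class DiagGaussian(ActionDistribution): def entropy(self): return tf.reduce_sum( - self.log_std + .5 * np.log(2.0 * np.pi * np.e), + .5 * self.log_std + .5 * np.log(2.0 * np.pi * np.e), reduction_indices=[1]) def sample(self):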