mirror of
https://github.com/wassname/ray.git
synced 2026-07-04 07:35:11 +08:00
fix free log std param (#964)
This commit is contained in:
committed by
Philipp Moritz
parent
99c8b1f38c
commit
e17412a72b
@@ -32,7 +32,7 @@ class ProximalPolicyLoss(object):
|
||||
# Do not split the last layer of the value function into
|
||||
# mean parameters and standard deviation parameters and
|
||||
# do not make the standard deviations free variables.
|
||||
vf_config["free_logstd"] = False
|
||||
vf_config["free_log_std"] = False
|
||||
with tf.variable_scope("value_function"):
|
||||
self.value_function = ModelCatalog.get_model(
|
||||
observations, 1, vf_config).outputs
|
||||
|
||||
Reference in New Issue
Block a user