[rllib] Fix PPO regression

2026-06-27 20:22:39 +08:00 · 2018-06-28 16:00:53 -07:00
parent 89460b8d11
commit 92ab7e56ec
1 changed files with 1 additions and 2 deletions
@@ -65,8 +65,7 @@ class LocalMultiGPUOptimizer(PolicyOptimizer):
        # all of the device copies are created.
        with self.local_evaluator.tf_sess.graph.as_default():
            with self.local_evaluator.tf_sess.as_default():
-                main_scope = tf.get_variable_scope()
-                with tf.variable_scope(main_scope, reuse=tf.AUTO_REUSE):
+                with tf.variable_scope("default", reuse=tf.AUTO_REUSE):
                    self.par_opt = LocalSyncParallelOptimizer(
                        tf.train.AdamOptimizer(self.sgd_stepsize),
                        self.devices,