[rllib] Fix error getting kl when simple_optimizer: True in multi-agent PPO

This commit is contained in:
Eric Liang
2019-05-27 17:24:45 -07:00
committed by GitHub
parent a45c61e19b
commit d7be5a5d36
3 changed files with 6 additions and 1 deletion
@@ -30,6 +30,7 @@ parser = argparse.ArgumentParser()
parser.add_argument("--num-agents", type=int, default=4)
parser.add_argument("--num-policies", type=int, default=2)
parser.add_argument("--num-iters", type=int, default=20)
+parser.add_argument("--simple", action="store_true")
class CustomModel1(Model):
@@ -103,6 +104,7 @@ if __name__ == "__main__":
config={
"env": "multi_cartpole",
"log_level": "DEBUG",
+"simple_optimizer": args.simple,
"num_sgd_iter": 10,
"multiagent": {
"policies": policies,
@@ -69,7 +69,7 @@ class SyncSamplesOptimizer(PolicyOptimizer):
self.num_steps_sampled += samples.count
self.num_steps_trained += samples.count
-return fetches
+return self.learner_stats
@override(PolicyOptimizer)
def stats(self):