diff --git a/doc/source/rllib-training.rst b/doc/source/rllib-training.rst index 0171de62f..9f8b0bf1f 100644 --- a/doc/source/rllib-training.rst +++ b/doc/source/rllib-training.rst @@ -41,7 +41,7 @@ can be used) and for choosing the algorithm with ``--run`` Specifying Parameters ~~~~~~~~~~~~~~~~~~~~~ -Each algorithm has specific hyperparameters that can be set with ``--config``. See the +Each algorithm has specific hyperparameters that can be set with ``--config``, in addition to a number of `common hyperparameters <https://github.com/ray-project/ray/blob/master/python/ray/rllib/agents/agent.py>`__. See the `algorithms documentation <rllib-algorithms.html>`__ for more information. In an example below, we train A3C by specifying 8 workers through the config flag. diff --git a/python/ray/rllib/agents/a3c/a3c.py b/python/ray/rllib/agents/a3c/a3c.py index a67a598f8..51537072f 100644 --- a/python/ray/rllib/agents/a3c/a3c.py +++ b/python/ray/rllib/agents/a3c/a3c.py @@ -30,7 +30,8 @@ DEFAULT_CONFIG = with_common_config({ "use_gpu_for_workers": False, # Whether to emit extra summary stats "summarize": False, - # Workers sample async + # Workers sample async. Note that this increases the effective + # sample_batch_size by up to 5x due to async buffering of batches. "sample_async": True, # Model and preprocessor options "model": {