diff --git a/ci/stress_tests/atari_impala_xlarge.yaml b/ci/stress_tests/atari_impala_xlarge.yaml new file mode 100644 index 000000000..8dd3dd4ab --- /dev/null +++ b/ci/stress_tests/atari_impala_xlarge.yaml @@ -0,0 +1,24 @@ +# Taken from rllib/tuned_examples/atari_impala_large.yaml + +# Runs on a g3.16xl node with 5 m5.24xl workers +# Takes roughly 10 minutes. x10? +atari-impala: + env: + grid_search: + - BreakoutNoFrameskip-v4 + - BeamRiderNoFrameskip-v4 + - QbertNoFrameskip-v4 + - SpaceInvadersNoFrameskip-v4 + run: IMPALA + stop: + timesteps_total: 30000000 + config: + sample_batch_size: 50 + train_batch_size: 500 + num_workers: 128 + num_envs_per_worker: 5 + clip_rewards: True + lr_schedule: [ + [0, 0.0005], + [20000000, 0.000000000001], + ] \ No newline at end of file