rllib regression

This commit is contained in:
Alex
2021-01-30 04:32:18 +00:00
parent 115afee4c3
commit ceb60965ae
3 changed files with 34456 additions and 8 deletions
@@ -21,11 +21,18 @@ auth:
head_node:
InstanceType: p3.16xlarge
ImageId: latest_dlami
file_mounts:
/compact-regression-tests-torch.yaml: compact-regression-tests-torch.yaml
/compact-regression-tests-tf.yaml: compact-regression-tests-tf.yaml
/run.sh: run.sh
# List of shell commands to run to set up nodes.
setup_commands:
- apt-get install -y libglib2.0-0 libcudnn7=7.6.5.32-1+cuda10.1
- pip install -U https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-2.0.0.dev0-cp37-cp37m-manylinux2014_x86_64.whl
- sudo apt-get install -y libglib2.0-0 libcudnn7=7.6.5.32-1+cuda10.1
- pip install -U https://ray-wheels.s3-us-west-2.amazonaws.com/releases/1.2.0/b4d87b8fc5ff03b868adba35b37da32b7be9f71f/ray-1.2.0-cp37-cp37m-manylinux2014_x86_64.whl
# Commands to start Ray on the head node. You don't need to change this.
head_start_ray_commands:
File diff suppressed because one or more lines are too long
+3 -6
View File
@@ -30,18 +30,13 @@ case "$i" in
esac
done
if [[ $ray_version == "" || $commit == "" || $ray_branch == "" ]]
then
echo "Provide --ray-version, --commit, and --ray-branch"
exit 1
fi
echo "version: $ray_version"
echo "commit: $commit"
echo "branch: $ray_branch"
echo "workload: ignored"
wheel="https://s3-us-west-2.amazonaws.com/ray-wheels/$ray_branch/$commit/ray-$ray_version-cp37-cp37m-manylinux2014_x86_64.whl"
wheel="https://ray-wheels.s3-us-west-2.amazonaws.com/releases/1.2.0/b4d87b8fc5ff03b868adba35b37da32b7be9f71f/ray-1.2.0-cp37-cp37m-manylinux2014_x86_64.whl"
conda uninstall -y terminado
pip install -U pip
@@ -51,6 +46,8 @@ pip install terminado
pip install torch==1.6 torchvision
pip install boto3==1.4.8 cython==0.29.0
ray stop
# Run the TensorFlow learning tests.
rllib train -f compact-regression-tests-tf.yaml