From 3322558287e701d1d1d6a7d7894c08087d55b465 Mon Sep 17 00:00:00 2001 From: Alex Wu Date: Tue, 26 Jul 2022 23:14:49 -0700 Subject: [PATCH] [autoscaler][aws] Fix example minimal (#27075) Why are these changes needed? The DLAMI moved underneath us and broke for 2 reasons: (1) The AMI's snapshot size increased to 140 GB, which was more than our hardcoded max EBS volume size of 100 GB. (2) The AMI dropped support for python 3.7 and only has 3.8 now. The short-term solutions are simple: (1) Allocate a bigger EBS volume. (2) Use the tensorflow Python 3.8 env (tensorflow2_p38). Related issue number Closes #26368 Co-authored-by: Alex --- python/ray/autoscaler/aws/defaults.yaml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/python/ray/autoscaler/aws/defaults.yaml b/python/ray/autoscaler/aws/defaults.yaml index 81141e7ddb8d3..c22a97fbf0d22 100644 --- a/python/ray/autoscaler/aws/defaults.yaml +++ b/python/ray/autoscaler/aws/defaults.yaml @@ -60,7 +60,7 @@ available_node_types: BlockDeviceMappings: - DeviceName: /dev/sda1 Ebs: - VolumeSize: 100 + VolumeSize: 256 # Additional options in the boto docs. ray.worker.default: # The minimum number of nodes of this type to launch. @@ -122,9 +122,9 @@ initialization_commands: [] # List of shell commands to run to set up nodes. setup_commands: - >- - (stat $HOME/anaconda3/envs/tensorflow2_latest_p37/ &> /dev/null && - echo 'export PATH="$HOME/anaconda3/envs/tensorflow2_latest_p37/bin:$PATH"' >> ~/.bashrc) || true - - which ray || pip install -U "ray[default] @ https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-3.0.0.dev0-cp37-cp37m-manylinux2014_x86_64.whl" + (stat $HOME/anaconda3/envs/tensorflow2_p38/ &> /dev/null && + echo 'export PATH="$HOME/anaconda3/envs/tensorflow2_p38/bin:$PATH"' >> ~/.bashrc) || true + - which ray || pip install -U "ray[default] @ https://s3-us-west-2.amazonaws.com/ray-wheels/latest/ray-3.0.0.dev0-cp38-cp38-manylinux2014_x86_64.whl" # Custom commands that will be run on the head node after common setup. 
head_setup_commands: