Skip to content

Commit

Permalink
[FluidStack] Fix provisioning and add new gpu types (#4359)
Browse files Browse the repository at this point in the history
[FluidStack] Fix provisioning and add new gpu types

    * Add new `provisioning` status to fix failed deployments

    * Add H100 SXM5 GPU mapping
  • Loading branch information
mjibril authored Nov 18, 2024
1 parent ed4329a commit bf4ef4d
Show file tree
Hide file tree
Showing 2 changed files with 23 additions and 4 deletions.
23 changes: 22 additions & 1 deletion sky/clouds/service_catalog/data_fetchers/fetch_fluidstack.py
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,26 @@
DEFAULT_FLUIDSTACK_API_KEY_PATH = os.path.expanduser('~/.fluidstack/api_key')

plan_vcpus_memory = [{
'gpu_type': 'H100_SXM5_80GB',
'gpu_count': 1,
'min_cpu_count': 52,
'min_memory': 450
}, {
'gpu_type': 'H100_SXM5_80GB',
'gpu_count': 2,
'min_cpu_count': 52,
'min_memory': 450
}, {
'gpu_type': 'H100_SXM5_80GB',
'gpu_count': 4,
'min_cpu_count': 104,
'min_memory': 900
}, {
'gpu_type': 'H100_SXM5_80GB',
'gpu_count': 8,
'min_cpu_count': 192,
'min_memory': 1800
}, {
'gpu_type': 'RTX_A6000_48GB',
'gpu_count': 2,
'min_cpu_count': 12,
Expand Down Expand Up @@ -150,7 +170,8 @@
'H100_PCIE_80GB': 'H100',
'H100_NVLINK_80GB': 'H100',
'A100_NVLINK_80GB': 'A100-80GB',
- 'A100_SXM4_80GB': 'A100-80GB',
+ 'A100_SXM4_80GB': 'A100-80GB-SXM',
+ 'H100_SXM5_80GB': 'H100-SXM',
'A100_PCIE_80GB': 'A100-80GB',
'A100_SXM4_40GB': 'A100',
'A100_PCIE_40GB': 'A100',
Expand Down
4 changes: 1 addition & 3 deletions sky/provision/fluidstack/instance.py
Original file line number Diff line number Diff line change
Expand Up @@ -79,9 +79,7 @@ def run_instances(region: str, cluster_name_on_cloud: str,
config: common.ProvisionConfig) -> common.ProvisionRecord:
"""Runs instances for the given cluster."""

- pending_status = [
- 'pending',
- ]
+ pending_status = ['pending', 'provisioning']
while True:
instances = _filter_instances(cluster_name_on_cloud, pending_status)
if len(instances) > config.count:
Expand Down

0 comments on commit bf4ef4d

Please sign in to comment.