From 76cdcc180998e57b21634717ffdcb1368d11915e Mon Sep 17 00:00:00 2001 From: Anna Pendleton Date: Wed, 18 Sep 2024 17:26:41 +0000 Subject: [PATCH] small fixes --- .../hpa-templates/hpa.vllm.custom_metric.yaml.tftpl | 10 ---------- benchmarks/inference-server/vllm/variables.tf | 6 ++---- 2 files changed, 2 insertions(+), 14 deletions(-) diff --git a/benchmarks/inference-server/vllm/hpa-templates/hpa.vllm.custom_metric.yaml.tftpl b/benchmarks/inference-server/vllm/hpa-templates/hpa.vllm.custom_metric.yaml.tftpl index 2c318d848..956241afd 100644 --- a/benchmarks/inference-server/vllm/hpa-templates/hpa.vllm.custom_metric.yaml.tftpl +++ b/benchmarks/inference-server/vllm/hpa-templates/hpa.vllm.custom_metric.yaml.tftpl @@ -11,15 +11,6 @@ spec: minReplicas: ${hpa_min_replicas} maxReplicas: ${hpa_max_replicas} metrics: -%{ if length(regexall("DCGM_.*", custom_metric_name)) > 0 } - - type: External - external: - metric: - name: prometheus.googleapis.com|${lower(custom_metric_name)}|unknown - target: - type: AverageValue - averageValue: ${hpa_averagevalue_target} -%{ else } - type: Pods pods: metric: @@ -27,4 +18,3 @@ spec: target: type: AverageValue averageValue: ${hpa_averagevalue_target} -%{ endif } diff --git a/benchmarks/inference-server/vllm/variables.tf b/benchmarks/inference-server/vllm/variables.tf index 71ff800ee..a59e4726f 100644 --- a/benchmarks/inference-server/vllm/variables.tf +++ b/benchmarks/inference-server/vllm/variables.tf @@ -107,15 +107,13 @@ variable "project_id" { type = string } - - variable "hpa_type" { - description = "How the TGI workload should be scaled." + description = "How the vllm workload should be scaled." type = string default = null nullable = true validation { - condition = var.hpa_type == null ? true : length(regexall("cpu|vllm.*|DCGM_.*", var.hpa_type)) > 0 + condition = var.hpa_type == null ? true : length(regexall("vllm.*", var.hpa_type)) > 0 error_message = "Allows values for hpa_type are {null, or vLLM metrics (e.g., \"vllm:num_requests_waiting\", \"vllm:gpu_cache_usage_perc\")}" } }