Skip to content

Commit

Permalink
fix readme
Browse files Browse the repository at this point in the history
  • Loading branch information
kaushikmitr committed Mar 8, 2024
1 parent 1e1f393 commit 904a233
Show file tree
Hide file tree
Showing 3 changed files with 7 additions and 4 deletions.
7 changes: 5 additions & 2 deletions benchmarks/inference-server/triton/main.tf
Original file line number Diff line number Diff line change
Expand Up @@ -15,17 +15,20 @@
*/

locals {
template_path = var.gcs_model_path == null

template_path = (
var.gcs_model_path == null
? "${path.module}/manifest-templates/triton-tensorrtllm-inference-docker.tftpl"
: "${path.module}/manifest-templates/triton-tensorrtllm-inference-gs.tftpl"
)
}

resource "kubernetes_manifest" "default" {
manifest = yamldecode(templatefile(local.template_path, {
namespace = var.namespace
ksa = var.ksa
image_path = var.image_path
huggingface-secret = var.huggingface-secret
huggingface_secret = var.huggingface_secret
gpu_count = var.gpu_count
model_id = var.model_id
gcs_model_path = var.gcs_model_path
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -50,7 +50,7 @@ spec:
- name: HUGGINGFACE_TOKEN
valueFrom:
secretKeyRef:
name: ${huggingface-secret}
name: ${huggingface_secret}
key: token
resources:
limits:
Expand Down
2 changes: 1 addition & 1 deletion benchmarks/inference-server/triton/variables.tf
Original file line number Diff line number Diff line change
Expand Up @@ -68,7 +68,7 @@ variable "ksa" {
default = "default"
}

variable "huggingface-secret" {
variable "huggingface_secret" {
description = "name of the kubectl huggingface secret token"
type = string
nullable = true
Expand Down

0 comments on commit 904a233

Please sign in to comment.