From c5a46693925c9638d288b05eb758bcf8fd22b599 Mon Sep 17 00:00:00 2001
From: Alvaro Bartolome <36760800+alvarobartt@users.noreply.github.com>
Date: Tue, 17 Sep 2024 11:14:43 +0200
Subject: [PATCH] Revert `image` on benchmarks until verified

Included a harmless TODO note so that we remember to come back to this once the benchmark is verified with the latest Hugging Face DLC for TGI

cc @annapendleton
---
NOTE(review): the line breaks and the indentation of the hunk below were
restored from a whitespace-collapsed copy of this patch. The context-line
indentation is assumed from the usual Deployment nesting -- confirm it against
the target file before applying, or apply with `git apply --ignore-whitespace`.

 .../manifest-templates/text-generation-inference.tftpl | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/benchmarks/inference-server/text-generation-inference/manifest-templates/text-generation-inference.tftpl b/benchmarks/inference-server/text-generation-inference/manifest-templates/text-generation-inference.tftpl
index 377b5bce0..eb7b46071 100644
--- a/benchmarks/inference-server/text-generation-inference/manifest-templates/text-generation-inference.tftpl
+++ b/benchmarks/inference-server/text-generation-inference/manifest-templates/text-generation-inference.tftpl
@@ -51,7 +51,7 @@ spec:
         - name: text-generation-inference
           ports:
             - containerPort: 80
-          image: "us-docker.pkg.dev/deeplearning-platform-release/gcr.io/huggingface-text-generation-inference-cu121.2-2.ubuntu2204.py310"
+          image: "ghcr.io/huggingface/text-generation-inference:1.4.2" # TODO(annapendleton,alvarobartt): update to Hugging Face DLC once verified
           args: ["--model-id", "${model_id}", "--num-shard", "${gpu_count}", "--max-concurrent-requests", "${max_concurrent_requests}"]
           env:
 %{ for hugging_face_token_secret in hugging_face_token_secret_list ~}