Skip to content

Commit

Permalink
fix readme
Browse files Browse the repository at this point in the history
  • Loading branch information
kaushikmitr committed Mar 8, 2024
1 parent f983f7d commit 1f22e32
Show file tree
Hide file tree
Showing 2 changed files with 9 additions and 9 deletions.
10 changes: 5 additions & 5 deletions benchmarks/inference-server/triton/main.tf
Original file line number Diff line number Diff line change
Expand Up @@ -14,12 +14,12 @@
* limitations under the License.
*/

locals {
locals {

template_path = (
var.gcs_model_path == null
? "${path.module}/manifest-templates/triton-tensorrtllm-inference-docker.tftpl"
: "${path.module}/manifest-templates/triton-tensorrtllm-inference-gs.tftpl"
var.gcs_model_path == null
? "${path.module}/manifest-templates/triton-tensorrtllm-inference-docker.tftpl"
: "${path.module}/manifest-templates/triton-tensorrtllm-inference-gs.tftpl"
)
}

Expand Down
8 changes: 4 additions & 4 deletions benchmarks/inference-server/triton/sample-terraform.tfvars
Original file line number Diff line number Diff line change
Expand Up @@ -2,8 +2,8 @@ credentials_config = {
fleet_host = "https://connectgateway.googleapis.com/v1/projects/$PROJECT_NUMBER/locations/global/gkeMemberships/ai-benchmark"
}

namespace = "benchmark"
ksa = "benchmark-ksa"
model_id = "meta-llama/Llama-2-7b-chat-hf"
gpu_count = 1
namespace = "benchmark"
ksa = "benchmark-ksa"
model_id = "meta-llama/Llama-2-7b-chat-hf"
gpu_count = 1
# NOTE(review): main.tf picks its manifest template with `var.gcs_model_path == null`.
# An empty string is not null in Terraform, so "" here appears to select the
# "-gs" template rather than the "-docker" one. Confirm whether this sample
# should carry a real gs:// path or leave the variable unset.
gcs_model_path = ""

0 comments on commit 1f22e32

Please sign in to comment.