readd container folder

GoogleCloudPlatform · Aug 23, 2024 · f1d56d6 · f1d56d6
1 parent 2ab541f
commit f1d56d6
Show file tree

Hide file tree

Showing 5 changed files with 555 additions and 0 deletions.
diff --git a/benchmarks/benchmark/tools/profile-generator/container/Dockerfile b/benchmarks/benchmark/tools/profile-generator/container/Dockerfile
@@ -0,0 +1,21 @@
+FROM nvidia/cuda:12.1.0-devel-ubuntu22.04 AS dev
+# OS tools and base Python packages; apt lists and pip's download cache are kept out of the layers.
+RUN apt-get update -y && apt-get install -y python3-pip git vim curl wget \
+    && rm -rf /var/lib/apt/lists/*
+RUN pip3 install --no-cache-dir --upgrade pip \
+    && pip install --no-cache-dir packaging torch transformers
+WORKDIR /workspace
+
+# Install build and runtime dependencies. Only the manifest is copied here, so
+# changes to the scripts copied later do not invalidate this layer.
+COPY requirements.txt requirements.txt
+RUN pip install --no-cache-dir -r requirements.txt \
+    && pip install --no-cache-dir -U "huggingface_hub[cli]"
+# Bake the ShareGPT dataset into the image. NOTE(review): URL tracks `main` with no checksum, so not reproducible.
+RUN wget --progress=dot:giga https://huggingface.co/datasets/anon8231489123/ShareGPT_Vicuna_unfiltered/resolve/main/ShareGPT_V3_unfiltered_cleaned_split.json
+
+# Benchmark scripts are copied after the dependency and dataset layers so that
+# editing them does not force those layers to be rebuilt.
+COPY benchmark_serving.py latency_throughput_curve.sh ./
+# One chmod layer for both scripts instead of a separate layer per file.
+RUN chmod +x benchmark_serving.py latency_throughput_curve.sh