-
Notifications
You must be signed in to change notification settings - Fork 158
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
Showing
5 changed files
with
555 additions
and
0 deletions.
There are no files selected for viewing
21 changes: 21 additions & 0 deletions
21
benchmarks/benchmark/tools/profile-generator/container/Dockerfile
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,21 @@ | ||
# Benchmark image: CUDA 12.1 development base plus Python tooling, the
# ShareGPT conversation dataset, and the benchmark driver scripts.
FROM nvidia/cuda:12.1.0-devel-ubuntu22.04 AS dev

# System tools. `update`, `install` and the index cleanup share one layer so a
# cached, stale package index is never reused and the index files are not
# shipped in the image. DEBIAN_FRONTEND is set inline (not via ENV) so it keeps
# debconf from prompting during the build without leaking into the runtime
# environment.
# NOTE(review): recommended packages are intentionally still installed; adding
# --no-install-recommends may drop things the later steps rely on (e.g. CA
# certificates for the HTTPS download, Python build tooling) - verify before
# tightening.
RUN apt-get update -y \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y \
        curl \
        git \
        python3-pip \
        vim \
        wget \
    && rm -rf /var/lib/apt/lists/*

# --no-cache-dir keeps pip's download/wheel cache out of the image layers,
# which matters here because torch is a very large download.
RUN pip3 install --no-cache-dir --upgrade pip
RUN pip install --no-cache-dir packaging torch transformers
WORKDIR /workspace

# install build and runtime dependencies
# The manifest is copied on its own, before the scripts, so editing a script
# does not invalidate the dependency layer.
COPY requirements.txt requirements.txt
RUN pip install --no-cache-dir -r requirements.txt

RUN pip install --no-cache-dir -U "huggingface_hub[cli]"

# Dataset used by the benchmark; saved into /workspace under its original
# file name.
# NOTE(review): the URL tracks the `main` revision, so the file contents are
# not pinned - consider pinning a commit and verifying a checksum.
RUN wget --no-verbose https://huggingface.co/datasets/anon8231489123/ShareGPT_Vicuna_unfiltered/resolve/main/ShareGPT_V3_unfiltered_cleaned_split.json

COPY benchmark_serving.py benchmark_serving.py
COPY latency_throughput_curve.sh latency_throughput_curve.sh

# Mark both entry scripts executable in a single layer.
RUN chmod +x latency_throughput_curve.sh benchmark_serving.py
Oops, something went wrong.