-
Notifications
You must be signed in to change notification settings - Fork 0
/
docker-compose.yml
52 lines (52 loc) · 1.22 KB
/
docker-compose.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
---
# Compose definitions for four variants of a transformers inference service:
# two are built locally (Dockerfile.gpu / Dockerfile.cpu) and two run prebuilt
# semitechnologies/transformers-inference images.
#
# NOTE(review): both locally built services publish host port 3000 and both
# prebuilt-image services publish host port 8080, so only one service of each
# pair can be running on a given host at a time - presumably they are meant to
# be started individually; confirm.
#
# NOTE(review): current Docker Compose releases treat the top-level `version`
# key as obsolete; it is kept here unchanged for older tooling.
version: '3.4'

services:
  # Locally built from Dockerfile.gpu (stage `release`); reserves one NVIDIA GPU.
  t2v-transformers-rs-gpu:
    build:
      context: .
      dockerfile: Dockerfile.gpu
      target: release
      # Build args are given as a mapping: Compose accepts either a mapping or
      # a list of KEY=VALUE strings here, not a list of single-key mappings.
      args:
        MODEL_NAME: "BAAI/bge-small-en-v1.5"
        # NOTE(review): TARGETARCH is normally supplied by BuildKit from the
        # target platform; confirm this explicit arm64 override is intended.
        TARGETARCH: "arm64"
        CUDA_VERSION: "12.4.1"
    ports:
      - "3000:3000"
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: 1
              capabilities: [gpu]

  # Locally built from Dockerfile.cpu (stage `release`); no device reservation.
  t2v-transformers-rs-cpu:
    build:
      context: .
      dockerfile: Dockerfile.cpu
      target: release
      # Same mapping form as the GPU build above.
      args:
        MODEL_NAME: "BAAI/bge-small-en-v1.5"
        # NOTE(review): see the TARGETARCH remark on the GPU service; confirm.
        TARGETARCH: "arm64"
    ports:
      - "3000:3000"

  # Prebuilt image with CUDA enabled via environment; reserves one NVIDIA GPU.
  t2v-transformers-py-gpu:
    image: semitechnologies/transformers-inference:baai-bge-small-en-v1.5
    ports:
      - "8080:8080"
    environment:
      # Values are quoted so they reach the container as strings.
      ENABLE_CUDA: "true"
      T2V_TRANSFORMERS_DIRECT_TOKENIZE: "true"
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: 1
              capabilities: [gpu]

  # Prebuilt `-onnx` image variant; no device reservation.
  t2v-transformers-py-cpu:
    image: semitechnologies/transformers-inference:baai-bge-small-en-v1.5-onnx
    ports:
      - "8080:8080"
    environment:
      T2V_TRANSFORMERS_DIRECT_TOKENIZE: "true"
...