Skip to content

Commit 425205b

Browse files
authored
[Doc] fix the port conflict issue in the usage example (#4379)
1 parent 2d64107 commit 425205b

File tree

5 files changed, with 6 additions and 6 deletions.

docs/get_started/ernie-4.5-vl.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -27,7 +27,7 @@ export ENABLE_V1_KVCACHE_SCHEDULER=1
2727
python -m fastdeploy.entrypoints.openai.api_server \
2828
--model baidu/ERNIE-4.5-VL-424B-A47B-Paddle \
2929
--port 8180 --engine-worker-queue-port 8181 \
30-
--cache-queue-port 8182 --metrics-port 8182 \
30+
--cache-queue-port 8183 --metrics-port 8182 \
3131
--tensor-parallel-size 8 \
3232
--quantization wint4 \
3333
--max-model-len 32768 \

docs/get_started/ernie-4.5.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -25,7 +25,7 @@ export ENABLE_V1_KVCACHE_SCHEDULER=1
2525
python -m fastdeploy.entrypoints.openai.api_server \
2626
--model baidu/ERNIE-4.5-300B-A47B-Paddle \
2727
--port 8180 --engine-worker-queue-port 8181 \
28-
--cache-queue-port 8182 --metrics-port 8182 \
28+
--cache-queue-port 8183 --metrics-port 8182 \
2929
--tensor-parallel-size 8 \
3030
--quantization wint4 \
3131
--max-model-len 32768 \

docs/zh/get_started/ernie-4.5-vl.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -27,7 +27,7 @@ export ENABLE_V1_KVCACHE_SCHEDULER=1
2727
python -m fastdeploy.entrypoints.openai.api_server \
2828
--model baidu/ERNIE-4.5-VL-424B-A47B-Paddle \
2929
--port 8180 --engine-worker-queue-port 8181 \
30-
--cache-queue-port 8182 --metrics-port 8182 \
30+
--cache-queue-port 8183 --metrics-port 8182 \
3131
--tensor-parallel-size 8 \
3232
--quantization wint4 \
3333
--max-model-len 32768 \

docs/zh/get_started/ernie-4.5.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -25,7 +25,7 @@ export ENABLE_V1_KVCACHE_SCHEDULER=1
2525
python -m fastdeploy.entrypoints.openai.api_server \
2626
--model baidu/ERNIE-4.5-300B-A47B-Paddle \
2727
--port 8180 --engine-worker-queue-port 8181 \
28-
--cache-queue-port 8182 --metrics-port 8182 \
28+
--cache-queue-port 8183 --metrics-port 8182 \
2929
--tensor-parallel-size 8 \
3030
--quantization wint4 \
3131
--max-model-len 32768 \

docs/zh/quantization/online_quantization.md

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@
1515
python -m fastdeploy.entrypoints.openai.api_server \
1616
--model baidu/ERNIE-4.5-300B-A47B-Paddle \
1717
--port 8180 --engine-worker-queue-port 8181 \
18-
--cache-queue-port 8182 --metrics-port 8182 \
18+
--cache-queue-port 8183 --metrics-port 8182 \
1919
--tensor-parallel-size 8 \
2020
--quantization wint8 \
2121
--max-model-len 32768 \
@@ -41,7 +41,7 @@ python -m fastdeploy.entrypoints.openai.api_server \
4141
python -m fastdeploy.entrypoints.openai.api_server \
4242
--model baidu/ERNIE-4.5-300B-A47B-Paddle \
4343
--port 8180 --engine-worker-queue-port 8181 \
44-
--cache-queue-port 8182 --metrics-port 8182 \
44+
--cache-queue-port 8183 --metrics-port 8182 \
4545
--tensor-parallel-size 8 \
4646
--quantization block_wise_fp8 \
4747
--max-model-len 32768 \

0 commit comments

Comments
 (0)