We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents fce8d8a + 376e9d6 commit a9d1d49Copy full SHA for a9d1d49
doc/zh/DeepseekR1_tutorial_zh_for_Ascend_NPU.md
@@ -108,6 +108,8 @@ export TASK_QUEUE_ENABLE=0 # 保证算子下发顺序有序
108
export USE_MERGE=0
109
export INF_NAN_MODE_FORCE_DISABLE=1
110
export TASK_QUEUE_ENABLE=0
111
+export RANK=0
112
+export LOCAL_WORLD_SIZE=1
113
#export PROF_DECODE=1
114
#export PROF_PREFILL=1
115
@@ -116,7 +118,6 @@ source /usr/local/Ascend/nnal/atb/set_env.sh
116
118
117
119
python ktransformers/server/main.py \
120
--port 10002 \
-
121
--model_path /mnt/data/models/DeepSeek-R1-q4km-w8a8 \
122
--gguf_path /mnt/data/models/DeepSeek-R1-q4km-w8a8 \
123
--model_name DeepSeekV3ForCausalLM \
0 commit comments