File tree Expand file tree Collapse file tree
zh/get_started/installation Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -480,7 +480,7 @@ python3 -m fastdeploy.entrypoints.openai.api_server \
480480 --cache-queue-port 55660 \
481481 --max-model-len 16384 \
482482 --max-num-batched-tokens 16384 \
483- --max-num-seqs 32 \
483+ --max-num-seqs 64 \
484484 --workers 2 \
485485 --block-size 16
486486```
Original file line number Diff line number Diff line change @@ -480,7 +480,7 @@ python3 -m fastdeploy.entrypoints.openai.api_server \
480480 --cache-queue-port 55660 \
481481 --max-model-len 16384 \
482482 --max-num-batched-tokens 16384 \
483- --max-num-seqs 32 \
483+ --max-num-seqs 64 \
484484 --workers 2 \
485485 --block-size 16
486486```
Original file line number Diff line number Diff line change @@ -577,6 +577,10 @@ def _start_worker_service(self):
577577 if self .cfg .structured_outputs_config .logits_processors is not None :
578578 arguments += f" --logits-processors { ' ' .join (self .cfg .structured_outputs_config .logits_processors )} "
579579
580+ # TODO (iluvatar): remove after paddle fixes the launch error
581+ if current_platform .is_iluvatar () and "CUDA_VISIBLE_DEVICES" in os .environ :
582+ arguments = arguments .replace (f"--devices { self .cfg .parallel_config .device_ids } " , "" )
583+
580584 worker_store_true_flag = {
581585 "enable_expert_parallel" : self .cfg .parallel_config .enable_expert_parallel ,
582586 "enable_chunked_moe" : self .cfg .parallel_config .enable_chunked_moe ,
Original file line number Diff line number Diff line change @@ -14,8 +14,8 @@ ln -sf /usr/local/bin/python3 /usr/local/bin/python
1414echo " pip requirements"
1515python -m pip install -r requirements_iluvatar.txt
1616echo " install paddle cpu and custom device"
17- python -m pip install paddlepaddle==3.3.0.dev20251103 -i https://www.paddlepaddle.org.cn/packages/nightly/cpu/
18- python -m pip install paddle-iluvatar-gpu==3.0.0.dev20251107 -i https://www.paddlepaddle.org.cn/packages/nightly/ixuca/
17+ python -m pip install paddlepaddle==3.3.0.dev20251219 -i https://www.paddlepaddle.org.cn/packages/nightly/cpu/
18+ python -m pip install paddle-iluvatar-gpu==3.0.0.dev20251219 -i https://www.paddlepaddle.org.cn/packages/nightly/ixuca/
1919echo " build whl"
2020bash build.sh || exit 1
2121
You can’t perform that action at this time.
0 commit comments