Update README.md
Browse files
README.md
CHANGED
|
@@ -322,7 +322,7 @@ MODEL=your/model/path
|
|
| 322 |
export ATTENTION_BACKEND=FLASH_ATTN_VLLM_V1
|
| 323 |
VLLM_USE_V1=1 VLLM_ATTENTION_BACKEND=${ATTENTION_BACKEND} CUDA_VISIBLE_DEVICES=0,1 python -m vllm.entrypoints.openai.api_server \
|
| 324 |
--seed 20250525 \
|
| 325 |
-
--port ${
|
| 326 |
--allowed-local-media-path $ALLOWED_LOCAL_MEDIA_PATH \
|
| 327 |
--max-model-len 8192 \
|
| 328 |
--max-num-batched-tokens 8192 \
|
|
|
|
| 322 |
export ATTENTION_BACKEND=FLASH_ATTN_VLLM_V1
|
| 323 |
VLLM_USE_V1=1 VLLM_ATTENTION_BACKEND=${ATTENTION_BACKEND} CUDA_VISIBLE_DEVICES=0,1 python -m vllm.entrypoints.openai.api_server \
|
| 324 |
--seed 20250525 \
|
| 325 |
+
--port ${PORT} \
|
| 326 |
--allowed-local-media-path $ALLOWED_LOCAL_MEDIA_PATH \
|
| 327 |
--max-model-len 8192 \
|
| 328 |
--max-num-batched-tokens 8192 \
|