|
@@ -40,13 +40,13 @@ model_name="DotsOCR"
|
|
|
vllm serve ${hf_model_path} \
|
|
vllm serve ${hf_model_path} \
|
|
|
--host 0.0.0.0 \
|
|
--host 0.0.0.0 \
|
|
|
--port 8101 \
|
|
--port 8101 \
|
|
|
- --gpu-memory-utilization 0.90 \
|
|
|
|
|
|
|
+ --gpu-memory-utilization 0.85 \
|
|
|
--max-log-len 1000 \
|
|
--max-log-len 1000 \
|
|
|
--trust-remote-code \
|
|
--trust-remote-code \
|
|
|
--max-model-len 65536 \
|
|
--max-model-len 65536 \
|
|
|
--max-num-batched-tokens 65536 \
|
|
--max-num-batched-tokens 65536 \
|
|
|
--uvicorn-log-level info \
|
|
--uvicorn-log-level info \
|
|
|
- --limit-mm-per-prompt '{"image": 5}' \
|
|
|
|
|
|
|
+ --limit-mm-per-prompt '{"image": 3}' \
|
|
|
--chat-template-content-format string \
|
|
--chat-template-content-format string \
|
|
|
--data-parallel-size 3 \
|
|
--data-parallel-size 3 \
|
|
|
--max-num-seqs 32 \
|
|
--max-num-seqs 32 \
|