2 miesięcy temu · d26ce1df8c
--- a/zhch/launch_model_vllm.sh
+++ b/zhch/launch_model_vllm.sh
@@ -40,13 +40,13 @@ model_name="DotsOCR"
 
															 vllm serve ${hf_model_path} \
														
 
															     --host 0.0.0.0 \
														
 
															     --port 8101 \
														
 
															-    --gpu-memory-utilization 0.90 \
														
 
															+    --gpu-memory-utilization 0.85 \
														
 
															     --max-log-len 1000 \
														
 
															     --trust-remote-code \
														
 
															 	--max-model-len 65536 \
														
 
															 	--max-num-batched-tokens 65536 \
														
 
															     --uvicorn-log-level info \
														
 
															-    --limit-mm-per-prompt '{"image": 5}' \
														
 
															+    --limit-mm-per-prompt '{"image": 3}' \
														
 
															     --chat-template-content-format string \
														
 
															     --data-parallel-size 3 \
														
 
															     --max-num-seqs 32 \