# paddleocr_vl_09b.py
# Copyright (c) 2025 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
  14. def get_config(backend):
  15. if backend == "fastdeploy":
  16. return {
  17. "gpu-memory-utilization": 0.3,
  18. "max-model-len": 16384,
  19. "max-num-batched-tokens": 131072,
  20. "max-num-seqs": 256,
  21. }
  22. elif backend == "vllm":
  23. return {
  24. "trust-remote-code": True,
  25. "gpu-memory-utilization": 0.5,
  26. "max-model-len": 16384,
  27. "max-num-batched-tokens": 131072,
  28. "api-server-count": 4,
  29. }
  30. elif backend == "sglang":
  31. return {
  32. "trust-remote-code": True,
  33. "mem-fraction-static": 0.5,
  34. "context-length": 16384,
  35. "max-prefill-tokens": 131072,
  36. }
  37. else:
  38. raise ValueError(f"Unsupported backend: {backend}")