test_table_recognition.py 1.5 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849
  1. # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License");
  4. # you may not use this file except in compliance with the License.
  5. # You may obtain a copy of the License at
  6. #
  7. # http://www.apache.org/licenses/LICENSE-2.0
  8. #
  9. # Unless required by applicable law or agreed to in writing, software
  10. # distributed under the License is distributed on an "AS IS" BASIS,
  11. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. # See the License for the specific language governing permissions and
  13. # limitations under the License.
  14. from paddlex import create_pipeline
  15. pipeline = create_pipeline(pipeline="table_recognition")
  16. output = pipeline.predict(
  17. "./test_samples/table_recognition.jpg",
  18. use_doc_orientation_classify=False,
  19. use_doc_unwarping=False,
  20. )
  21. # output = pipeline.predict(
  22. # "./test_samples/table_recognition.jpg",
  23. # use_doc_orientation_classify=True,
  24. # use_doc_unwarping=True
  25. # )
  26. # output = pipeline.predict(
  27. # "./test_samples/table_recognition.jpg",
  28. # use_doc_orientation_classify=False,
  29. # use_doc_unwarping=False,
  30. # use_layout_detection=False
  31. # )
  32. # output = pipeline.predict(
  33. # "./test_samples/table_recognition.jpg"
  34. # )
  35. # output = pipeline("./test_samples/财报1.pdf")
  36. for res in output:
  37. print(res)
  38. res.print()
  39. res.save_to_img("./output")
  40. res.save_to_json("./output")
  41. res.save_to_xlsx("./output")
  42. res.save_to_html("./output")