# magic_model.py
  1. class MagicModel():
  2. """
  3. 每个函数没有得到元素的时候返回空list
  4. """
  5. def __fix_axis():
  6. # TODO 计算
  7. self.__model_list = xx
  8. def __init__(model_list:list, page:Page):
  9. self.__model_list = model_list
  10. self.__fix_axis()
  11. self.__page = page
  12. def get_imgs(self, page_no:int): # @许瑞
  13. return_lst = []
  14. img = {
  15. "bbox":[x0,y0,x1,y1]
  16. }
  17. img_caption = {
  18. "bbox":[x0,y0,x1,y1],
  19. "text":"",
  20. }
  21. return [{"img":img, "caption":img_caption},]
  22. def get_tables(self, page_no:int) ->list: # 3个坐标, caption, table主体,table-note
  23. pass # 许瑞
  24. def get_equations(self, page_no:int)->list: # 有坐标,也有字
  25. return inline_equations, interline_equations # @凯文
  26. def get_discarded(self, page_no:int)->list: # 自研模型,只有坐标
  27. pass # @凯文
  28. def get_text_blocks(self, page_no:int)->list: # 自研模型搞的,只有坐标,没有字
  29. pass # @凯文
  30. def get_title_blocks(self, page_no:int)->list: # 自研模型,只有坐标,没字
  31. pass # @凯文
  32. def get_ocr_text(self, page_no:int)->list: # paddle 搞的,有字也有坐标
  33. pass # @小蒙
  34. def get_ocr_spans(self, page_no:int)->list:
  35. pass # @小蒙