enum_class.py 3.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132
  1. from enum import Enum
  2. class BlockType:
  3. IMAGE = 'image'
  4. TABLE = 'table'
  5. IMAGE_BODY = 'image_body'
  6. TABLE_BODY = 'table_body'
  7. IMAGE_CAPTION = 'image_caption'
  8. TABLE_CAPTION = 'table_caption'
  9. IMAGE_FOOTNOTE = 'image_footnote'
  10. TABLE_FOOTNOTE = 'table_footnote'
  11. TEXT = 'text'
  12. TITLE = 'title'
  13. INTERLINE_EQUATION = 'interline_equation'
  14. LIST = 'list'
  15. INDEX = 'index'
  16. DISCARDED = 'discarded'
  17. # Added in vlm 2.5
  18. CODE = "code"
  19. CODE_BODY = "code_body"
  20. CODE_CAPTION = "code_caption"
  21. ALGORITHM = "algorithm"
  22. REF_TEXT = "ref_text"
  23. PHONETIC = "phonetic"
  24. HEADER = "header"
  25. FOOTER = "footer"
  26. PAGE_NUMBER = "page_number"
  27. ASIDE_TEXT = "aside_text"
  28. PAGE_FOOTNOTE = "page_footnote"
  29. class ContentType:
  30. IMAGE = 'image'
  31. TABLE = 'table'
  32. TEXT = 'text'
  33. INTERLINE_EQUATION = 'interline_equation'
  34. INLINE_EQUATION = 'inline_equation'
  35. EQUATION = 'equation'
  36. CODE = 'code'
  37. class ContentTypeV2:
  38. CODE = 'code'
  39. ALGORITHM = "algorithm"
  40. EQUATION_INTERLINE = 'equation_interline'
  41. IMAGE = 'image'
  42. TABLE = 'table'
  43. TABLE_SIMPLE = 'simple_table'
  44. TABLE_COMPLEX = 'complex_table'
  45. LIST = 'list'
  46. LIST_TEXT = 'text_list'
  47. LIST_REF = 'reference_list'
  48. TITLE = 'title'
  49. PARAGRAPH = 'paragraph'
  50. SPAN_TEXT = 'text'
  51. SPAN_EQUATION_INLINE = 'equation_inline'
  52. SPAN_PHONETIC = 'phonetic'
  53. SPAN_MD = 'md'
  54. SPAN_CODE_INLINE = 'code_inline'
  55. PAGE_HEADER = "page_header"
  56. PAGE_FOOTER = "page_footer"
  57. PAGE_NUMBER = "page_number"
  58. PAGE_ASIDE_TEXT = "page_aside_text"
  59. PAGE_FOOTNOTE = "page_footnote"
  60. class CategoryId:
  61. Title = 0
  62. Text = 1
  63. Abandon = 2
  64. ImageBody = 3
  65. ImageCaption = 4
  66. TableBody = 5
  67. TableCaption = 6
  68. TableFootnote = 7
  69. InterlineEquation_Layout = 8
  70. InterlineEquationNumber_Layout = 9
  71. InlineEquation = 13
  72. InterlineEquation_YOLO = 14
  73. OcrText = 15
  74. LowScoreText = 16
  75. ImageFootnote = 101
  76. class MakeMode:
  77. MM_MD = 'mm_markdown'
  78. NLP_MD = 'nlp_markdown'
  79. CONTENT_LIST = 'content_list'
  80. CONTENT_LIST_V2 = 'content_list_v2'
  81. class ModelPath:
  82. vlm_root_hf = "opendatalab/MinerU2.5-2509-1.2B"
  83. vlm_root_modelscope = "OpenDataLab/MinerU2.5-2509-1.2B"
  84. pipeline_root_modelscope = "OpenDataLab/PDF-Extract-Kit-1.0"
  85. pipeline_root_hf = "opendatalab/PDF-Extract-Kit-1.0"
  86. doclayout_yolo = "models/Layout/YOLO/doclayout_yolo_docstructbench_imgsz1280_2501.pt"
  87. yolo_v8_mfd = "models/MFD/YOLO/yolo_v8_ft.pt"
  88. unimernet_small = "models/MFR/unimernet_hf_small_2503"
  89. pp_formulanet_plus_m = "models/MFR/pp_formulanet_plus_m"
  90. pytorch_paddle = "models/OCR/paddleocr_torch"
  91. layout_reader = "models/ReadingOrder/layout_reader"
  92. slanet_plus = "models/TabRec/SlanetPlus/slanet-plus.onnx"
  93. unet_structure = "models/TabRec/UnetStructure/unet.onnx"
  94. paddle_table_cls = "models/TabCls/paddle_table_cls/PP-LCNet_x1_0_table_cls.onnx"
  95. paddle_orientation_classification = "models/OriCls/paddle_orientation_classification/PP-LCNet_x1_0_doc_ori.onnx"
  96. class SplitFlag:
  97. CROSS_PAGE = 'cross_page'
  98. LINES_DELETED = 'lines_deleted'
  99. class ImageType:
  100. PIL = 'pil_img'
  101. BASE64 = 'base64_img'
  102. class NotExtractType(Enum):
  103. TEXT = BlockType.TEXT
  104. TITLE = BlockType.TITLE
  105. HEADER = BlockType.HEADER
  106. FOOTER = BlockType.FOOTER
  107. PAGE_NUMBER = BlockType.PAGE_NUMBER
  108. PAGE_FOOTNOTE = BlockType.PAGE_FOOTNOTE
  109. REF_TEXT = BlockType.REF_TEXT
  110. TABLE_CAPTION = BlockType.TABLE_CAPTION
  111. IMAGE_CAPTION = BlockType.IMAGE_CAPTION
  112. TABLE_FOOTNOTE = BlockType.TABLE_FOOTNOTE
  113. IMAGE_FOOTNOTE = BlockType.IMAGE_FOOTNOTE
  114. CODE_CAPTION = BlockType.CODE_CAPTION